{"id":"https://openalex.org/W7151501873","doi":"https://doi.org/10.1109/icmla66185.2025.00130","title":"Oracle-Guided Soft Shielding for Safe Move Prediction in Chess","display_name":"Oracle-Guided Soft Shielding for Safe Move Prediction in Chess","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W7151501873","doi":"https://doi.org/10.1109/icmla66185.2025.00130"},"language":null,"primary_location":{"id":"doi:10.1109/icmla66185.2025.00130","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla66185.2025.00130","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Machine Learning and Applications (ICMLA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133138106","display_name":"Prajit T Rajendran","orcid":null},"institutions":[{"id":"https://openalex.org/I2738703131","display_name":"Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives","ror":"https://ror.org/00jjx8s55","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131"]},{"id":"https://openalex.org/I277688954","display_name":"Universit\u00e9 Paris-Saclay","ror":"https://ror.org/03xjwb503","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954"]},{"id":"https://openalex.org/I4210085861","display_name":"Laboratoire d'Int\u00e9gration des Syst\u00e8mes et des Technologies","ror":"https://ror.org/000dbcc61","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131","https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I4210085861","https://openalex.org/I4210117989"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Prajit T Rajendran","raw_affiliation_strings":["Universit&#x00E9; Paris-Saclay,CEA LIST,France"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; Paris-Saclay,CEA LIST,France","institution_ids":["https://openalex.org/I277688954","https://openalex.org/I2738703131","https://openalex.org/I4210085861"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083483449","display_name":"Fabio Arn\u00e9z","orcid":"https://orcid.org/0000-0003-0367-3035"},"institutions":[{"id":"https://openalex.org/I2738703131","display_name":"Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives","ror":"https://ror.org/00jjx8s55","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131"]},{"id":"https://openalex.org/I277688954","display_name":"Universit\u00e9 Paris-Saclay","ror":"https://ror.org/03xjwb503","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954"]},{"id":"https://openalex.org/I4210085861","display_name":"Laboratoire d'Int\u00e9gration des Syst\u00e8mes et des Technologies","ror":"https://ror.org/000dbcc61","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131","https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I4210085861","https://openalex.org/I4210117989"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Fabio Arnez","raw_affiliation_strings":["Universit&#x00E9; Paris-Saclay,CEA LIST,France"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; Paris-Saclay,CEA LIST,France","institution_ids":["https://openalex.org/I277688954","https://openalex.org/I2738703131","https://openalex.org/I4210085861"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123073974","display_name":"Huascar Espinoza","orcid":null},"institutions":[{"id":"https://openalex.org/I4210137856","display_name":"Centre Hospitalier Interr\u00e9gional Edith Cavell","ror":"https://ror.org/03003by36","country_code":"BE","type":"healthcare","lineage":["https://openalex.org/I4210137856"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Huascar Espinoza","raw_affiliation_strings":["Chips JU,Brussels,Belgium"],"affiliations":[{"raw_affiliation_string":"Chips JU,Brussels,Belgium","institution_ids":["https://openalex.org/I4210137856"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009594268","display_name":"Agn\u00e8s Delaborde","orcid":"https://orcid.org/0000-0001-8882-4378"},"institutions":[{"id":"https://openalex.org/I4210107682","display_name":"Laboratoire National de M\u00e9trologie et d'Essais","ror":"https://ror.org/01ph39d13","country_code":"FR","type":"other","lineage":["https://openalex.org/I4210107682"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Agnes Delaborde","raw_affiliation_strings":["Laboratoire National de Metrologie et d&#x2019;Essais,France"],"affiliations":[{"raw_affiliation_string":"Laboratoire National de Metrologie et d&#x2019;Essais,France","institution_ids":["https://openalex.org/I4210107682"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063618543","display_name":"Chokri Mraidha","orcid":"https://orcid.org/0000-0003-2993-5734"},"institutions":[{"id":"https://openalex.org/I2738703131","display_name":"Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives","ror":"https://ror.org/00jjx8s55","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131"]},{"id":"https://openalex.org/I277688954","display_name":"Universit\u00e9 Paris-Saclay","ror":"https://ror.org/03xjwb503","country_code":"FR","type":"education","lineage":["https://openalex.org/I277688954"]},{"id":"https://openalex.org/I4210085861","display_name":"Laboratoire d'Int\u00e9gration des Syst\u00e8mes et des Technologies","ror":"https://ror.org/000dbcc61","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131","https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I4210085861","https://openalex.org/I4210117989"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Chokri Mraidha","raw_affiliation_strings":["Universit&#x00E9; Paris-Saclay,CEA LIST,France"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E9; Paris-Saclay,CEA LIST,France","institution_ids":["https://openalex.org/I277688954","https://openalex.org/I2738703131","https://openalex.org/I4210085861"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5133138106"],"corresponding_institution_ids":["https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I4210085861"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.87289353,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"875","last_page":"880"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.3912000060081482,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.3912000060081482,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.13249999284744263,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11674","display_name":"Sports Analytics and Performance","score":0.0731000006198883,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.24480000138282776},{"id":"https://openalex.org/keywords/electromagnetic-shielding","display_name":"Electromagnetic shielding","score":0.23469999432563782}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4113999903202057},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.39750000834465027},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.3027999997138977},{"id":"https://openalex.org/C171146098","wikidata":"https://www.wikidata.org/wiki/Q124192","display_name":"Automotive engineering","level":1,"score":0.2865999937057495},{"id":"https://openalex.org/C199639397","wikidata":"https://www.wikidata.org/wiki/Q1788588","display_name":"Engineering drawing","level":1,"score":0.26019999384880066},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.24480000138282776},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.23770000040531158},{"id":"https://openalex.org/C2265751","wikidata":"https://www.wikidata.org/wiki/Q332007","display_name":"Electromagnetic shielding","level":2,"score":0.23469999432563782},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.2313999980688095},{"id":"https://openalex.org/C77595967","wikidata":"https://www.wikidata.org/wiki/Q3151013","display_name":"Forensic engineering","level":1,"score":0.22679999470710754}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icmla66185.2025.00130","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla66185.2025.00130","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Machine Learning and Applications (ICMLA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2169206416","https://openalex.org/W2902907165","https://openalex.org/W2963575966","https://openalex.org/W2966994213","https://openalex.org/W3003342008","https://openalex.org/W3138984732","https://openalex.org/W3202598378","https://openalex.org/W4249241440","https://openalex.org/W4295046628","https://openalex.org/W4306679387","https://openalex.org/W4385764501","https://openalex.org/W4392172476","https://openalex.org/W4402402057","https://openalex.org/W4415795277","https://openalex.org/W7133297822"],"related_works":[],"abstract_inverted_index":{"Agents":[0],"relying":[1],"purely":[2],"on":[3,164],"imitation":[4,136],"learning":[5,9,45,126,137],"(IL)":[6],"or":[7],"reinforcement":[8],"(RL)":[10],"often":[11],"struggle":[12],"to":[13,37,195,232],"avoid":[14],"safety-critical":[15],"errors":[16],"during":[17],"exploration.":[18],"Existing":[19],"RL":[20],"approaches":[21],"for":[22,57,118],"environments":[23],"such":[24,70,94,199],"as":[25,71,95,200,219],"chess":[26],"require":[27],"hundreds":[28],"of":[29,31,142],"thousands":[30],"episodes":[32],"and":[33,74,86,159,185,204],"substantial":[34],"computational":[35],"resources":[36],"converge.":[38],"Unlike":[39],"RL,":[40],"IL":[41,64],"enables":[42],"efficient":[43],"policy":[44],"from":[46,83,131,156],"expert":[47,157],"demonstrations":[48],"without":[49,236],"requiring":[50],"costly":[51],"trial-and-error":[52],"interaction,":[53],"making":[54],"it":[55],"well-suited":[56],"complex":[58],"domains":[59],"like":[60],"chess.":[61],"In":[62,104,139],"addition,":[63],"can":[65,99],"capture":[66],"nuanced,":[67],"human-aligned":[68],"behaviors":[69],"strategic":[72],"patterns":[73],"stylistic":[75],"preferences.":[76],"However,":[77],"IL-based":[78],"agents":[79],"may":[80],"inherit":[81],"biases":[82],"training":[84],"data":[85],"lack":[87],"safeguards":[88],"against":[89],"rare":[90],"but":[91],"critical":[92],"mistakes,":[93],"tactical":[96,168,238],"blunders":[97],"that":[98,181,210],"decisively":[100],"impact":[101],"game":[102],"outcomes.":[103],"this":[105],"work,":[106],"we":[107,144],"propose":[108],"Oracle-Guided":[109],"Soft":[110],"Shielding":[111],"(OGSS),":[112],"a":[113,127,146,149,160,178,214],"simple":[114],"yet":[115,190],"effective":[116],"framework":[117],"safer":[119],"move":[120,150,183],"prediction,":[121],"enabling":[122,188],"safe":[123,189],"exploration":[124,222,235],"by":[125,226],"probabilistic":[128],"safety":[129],"model":[130,152],"oracle":[132],"feedback":[133],"in":[134],"an":[135],"setting.":[138],"the":[140,172,220],"domain":[141],"chess,":[143],"employ":[145],"two-model":[147],"architecture:":[148],"prediction":[151],"predicts":[153],"strong":[154],"moves":[155,176],"games,":[158],"blunder":[161,186,216],"model,":[162],"trained":[163],"Stockfish":[165],"evaluations,":[166],"estimates":[167],"risk.":[169],"At":[170],"inference,":[171],"agent":[173],"scores":[174],"candidate":[175],"using":[177],"utility":[179],"function":[180],"combines":[182],"likelihood":[184],"probability,":[187],"competitive":[191],"game-play.":[192],"When":[193],"compared":[194],"other":[196],"prominent":[197],"methods":[198],"action":[201],"pruning,":[202],"SafeDAgger,":[203],"uncertainty-based":[205],"sampling,":[206],"our":[207],"results":[208],"demonstrate":[209],"OGSS":[211],"variants":[212],"maintain":[213],"lower":[215],"rate":[217],"even":[218],"agent\u2019s":[221],"ratio":[223],"is":[224],"increased":[225],"several":[227],"folds,":[228],"highlighting":[229],"its":[230],"ability":[231],"support":[233],"broader":[234],"compromising":[237],"soundness.":[239]},"counts_by_year":[],"updated_date":"2026-04-09T06:08:40.794217","created_date":"2026-04-08T00:00:00"}
