{"id":"https://openalex.org/W4416873168","doi":"https://doi.org/10.1109/tkde.2025.3638864","title":"Learnable Game-Theoretic Policy Optimization for Data-Centric Self-Explanation Rationalization","display_name":"Learnable Game-Theoretic Policy Optimization for Data-Centric Self-Explanation Rationalization","publication_year":2025,"publication_date":"2025-12-01","ids":{"openalex":"https://openalex.org/W4416873168","doi":"https://doi.org/10.1109/tkde.2025.3638864"},"language":null,"primary_location":{"id":"doi:10.1109/tkde.2025.3638864","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tkde.2025.3638864","pdf_url":null,"source":{"id":"https://openalex.org/S30698027","display_name":"IEEE Transactions on Knowledge and Data Engineering","issn_l":"1041-4347","issn":["1041-4347","1558-2191","2326-3865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Knowledge and Data Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103153753","display_name":"Yunxiao Zhao","orcid":"https://orcid.org/0000-0002-9133-7324"},"institutions":[{"id":"https://openalex.org/I181877577","display_name":"Shanxi University","ror":"https://ror.org/03y3e3s17","country_code":"CN","type":"education","lineage":["https://openalex.org/I181877577"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yunxiao Zhao","raw_affiliation_strings":["School of Computer and Information Technology, Shanxi University, Taiyuan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Shanxi University, Taiyuan, China","institution_ids":["https://openalex.org/I181877577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100404740","display_name":"Zhiqiang Wang","orcid":"https://orcid.org/0000-0002-9269-3988"},"institutions":[{"id":"https://openalex.org/I181877577","display_name":"Shanxi University","ror":"https://ror.org/03y3e3s17","country_code":"CN","type":"education","lineage":["https://openalex.org/I181877577"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiqiang Wang","raw_affiliation_strings":["School of Computer and Information Technology, Shanxi University, Taiyuan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Shanxi University, Taiyuan, China","institution_ids":["https://openalex.org/I181877577"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048717995","display_name":"Xingtong Yu","orcid":"https://orcid.org/0000-0002-2884-8578"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Xingtong Yu","raw_affiliation_strings":["School of Computer and Information Systems, Singapore Management University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Systems, Singapore Management University, Singapore","institution_ids":["https://openalex.org/I79891267"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100418684","display_name":"Xiaoli Li","orcid":"https://orcid.org/0000-0002-0762-6562"},"institutions":[{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Xiaoli Li","raw_affiliation_strings":["Institute for Infocomm Research, Singapore","Institute for Infocomm Research, A*Star, Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research, Singapore","institution_ids":["https://openalex.org/I3005327000"]},{"raw_affiliation_string":"Institute for Infocomm Research, A*Star, Singapore","institution_ids":["https://openalex.org/I3005327000"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106626932","display_name":"Jiye Liang","orcid":"https://orcid.org/0000-0001-5887-9327"},"institutions":[{"id":"https://openalex.org/I181877577","display_name":"Shanxi University","ror":"https://ror.org/03y3e3s17","country_code":"CN","type":"education","lineage":["https://openalex.org/I181877577"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiye Liang","raw_affiliation_strings":["School of Computer and Information Technology, Shanxi University, Taiyuan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Shanxi University, Taiyuan, China","institution_ids":["https://openalex.org/I181877577"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100697664","display_name":"Ru Li","orcid":"https://orcid.org/0000-0003-1545-5553"},"institutions":[{"id":"https://openalex.org/I181877577","display_name":"Shanxi University","ror":"https://ror.org/03y3e3s17","country_code":"CN","type":"education","lineage":["https://openalex.org/I181877577"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ru Li","raw_affiliation_strings":["School of Computer and Information Technology, Shanxi University, Taiyuan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Shanxi University, Taiyuan, China","institution_ids":["https://openalex.org/I181877577"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5103153753"],"corresponding_institution_ids":["https://openalex.org/I181877577"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.20917864,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"38","issue":"2","first_page":"1159","last_page":"1173"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.7580999732017517,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.7580999732017517,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.04699999839067459,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.012900000438094139,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rationalization","display_name":"Rationalization (economics)","score":0.807200014591217},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.4945000112056732},{"id":"https://openalex.org/keywords/generator","display_name":"Generator (circuit theory)","score":0.45260000228881836},{"id":"https://openalex.org/keywords/game-theory","display_name":"Game theory","score":0.44760000705718994},{"id":"https://openalex.org/keywords/nash-equilibrium","display_name":"Nash equilibrium","score":0.4072999954223633},{"id":"https://openalex.org/keywords/outcome","display_name":"Outcome (game theory)","score":0.3677999973297119}],"concepts":[{"id":"https://openalex.org/C52438962","wikidata":"https://www.wikidata.org/wiki/Q1555139","display_name":"Rationalization (economics)","level":2,"score":0.807200014591217},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7775999903678894},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.4945000112056732},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.45260000228881836},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.44760000705718994},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.44119998812675476},{"id":"https://openalex.org/C46814582","wikidata":"https://www.wikidata.org/wiki/Q23389","display_name":"Nash equilibrium","level":2,"score":0.4072999954223633},{"id":"https://openalex.org/C148220186","wikidata":"https://www.wikidata.org/wiki/Q7111912","display_name":"Outcome (game theory)","level":2,"score":0.3677999973297119},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.3125999867916107},{"id":"https://openalex.org/C164407509","wikidata":"https://www.wikidata.org/wiki/Q5384490","display_name":"Equilibrium selection","level":4,"score":0.3043999969959259},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.2752000093460083},{"id":"https://openalex.org/C146930158","wikidata":"https://www.wikidata.org/wiki/Q656416","display_name":"Extensive-form game","level":4,"score":0.27410000562667847},{"id":"https://openalex.org/C73795354","wikidata":"https://www.wikidata.org/wiki/Q287618","display_name":"Sequential game","level":3,"score":0.2678000032901764},{"id":"https://openalex.org/C94766913","wikidata":"https://www.wikidata.org/wiki/Q1530271","display_name":"Equilibrium point","level":3,"score":0.26260000467300415},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.2538999915122986}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tkde.2025.3638864","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tkde.2025.3638864","pdf_url":null,"source":{"id":"https://openalex.org/S30698027","display_name":"IEEE Transactions on Knowledge and Data Engineering","issn_l":"1041-4347","issn":["1041-4347","1558-2191","2326-3865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Knowledge and Data Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W2001259128","https://openalex.org/W2024390895","https://openalex.org/W2160409620","https://openalex.org/W2250539671","https://openalex.org/W2516809705","https://openalex.org/W2788403449","https://openalex.org/W2889436406","https://openalex.org/W2949227999","https://openalex.org/W2950635152","https://openalex.org/W2963029083","https://openalex.org/W2963233086","https://openalex.org/W2970155250","https://openalex.org/W3034917890","https://openalex.org/W3035503910","https://openalex.org/W3092083846","https://openalex.org/W3105868192","https://openalex.org/W3138819813","https://openalex.org/W3165967177","https://openalex.org/W4225881819","https://openalex.org/W4283796092","https://openalex.org/W4309634482","https://openalex.org/W4309674289","https://openalex.org/W4375869251","https://openalex.org/W4378711560","https://openalex.org/W4385570896","https://openalex.org/W4385571168","https://openalex.org/W4385571271","https://openalex.org/W4389520103","https://openalex.org/W4389520359","https://openalex.org/W4389524578","https://openalex.org/W4391099575","https://openalex.org/W4393147214","https://openalex.org/W4394711241","https://openalex.org/W4400909704","https://openalex.org/W4402671152","https://openalex.org/W4402671449","https://openalex.org/W4404782742","https://openalex.org/W4406123692","https://openalex.org/W4411934347","https://openalex.org/W7117997420"],"related_works":[],"abstract_inverted_index":{"Rationalization,":[0],"a":[1,16,27,32,46,77,110,122,154,172,209,221],"data-centric":[2],"framework,":[3],"aims":[4],"to":[5,9,65,139,143,151,153,194,253],"build":[6],"self-explanatory":[7],"models":[8],"explain":[10],"the":[11,22,35,40,84,90,128,134,149,196,200,206,217,226,229],"prediction":[12],"outcome":[13],"by":[14,45],"generating":[15],"subset":[17],"of":[18,21,39,131,219,228],"human-intelligible":[19,37],"pieces":[20],"input":[23,41],"data.":[24],"It":[25],"involves":[26],"cooperative":[28,119,201],"game":[29,156,197,202],"model":[30,207],"where":[31,247],"generator":[33,91,135],"generates":[34],"most":[36],"parts":[38],"(i.e.,":[42],"rationales),":[43],"followed":[44],"predictor":[47,85],"that":[48],"makes":[49],"predictions":[50,88,159],"based":[51],"on":[52,237],"these":[53,72],"generated":[54],"rationales.":[55],"Conventional":[56],"rationalization":[57,120],"methods":[58,73],"typically":[59,102],"impose":[60],"constraints":[61],"via":[62],"regularization":[63],"terms":[64],"calibrate":[66],"or":[67],"penalize":[68],"undesired":[69],"generation.":[70],"However,":[71],"are":[74,101,264],"suffering":[75],"from":[76,121],"problem":[78],"called":[79],"mode":[80],"collapse,":[81],"in":[82,199],"which":[83,189],"produces":[86],"correct":[87],"yet":[89],"consistently":[92],"outputs":[93],"rationales":[94],"with":[95],"collapsed":[96,107,163],"patterns.":[97],"Moreover,":[98],"existing":[99,258],"studies":[100],"designed":[103],"separately":[104],"for":[105],"specific":[106],"patterns,":[108],"lacking":[109],"unified":[111],"consideration.":[112],"In":[113],"this":[114,132,167],"paper,":[115],"we":[116,169,233],"systematically":[117],"revisit":[118],"novel":[123,173],"game-theoretic":[124],"perspective":[125],"and":[126,224,243,262],"identify":[127],"fundamental":[129],"cause":[130,218],"problem:":[133],"no":[136],"longer":[137],"tends":[138],"explore":[140],"new":[141],"strategies":[142],"uncover":[144],"informative":[145],"rationales,":[146],"ultimately":[147],"leading":[148],"system":[150],"converge":[152],"suboptimal":[155,222],"equilibrium":[157,198,223],"(correct":[158],"<italic":[160],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[161,177,180,184,187,249,268],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">v.s</i>":[162],"rationales).":[164],"To":[165],"solve":[166],"problem,":[168],"then":[170],"propose":[171],"approach,":[174],"Game-theoretic":[175],"<bold":[176,179,183],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">P</b>olicy":[178],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">O</b>ptimization":[181],"oriented":[182],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">RAT</b>ionalization":[185],"(<sc":[186],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">PoRat</small>),":[188],"progressively":[190],"introduces":[191],"policy":[192],"interventions":[193],"address":[195],"process,":[203],"thereby":[204],"guiding":[205],"toward":[208],"more":[210],"optimal":[211],"solution":[212],"state.":[213],"We":[214],"theoretically":[215],"analyse":[216],"such":[220],"prove":[225],"feasibility":[227],"proposed":[230],"method.":[231],"Furthermore,":[232],"validate":[234],"our":[235],"method":[236],"nine":[238],"widely":[239],"used":[240],"real-world":[241],"datasets":[242],"two":[244],"synthetic":[245],"settings,":[246],"<sc":[248],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">PoRat</small>":[250],"achieves":[251],"up":[252],"8.1%":[254],"performance":[255],"improvements":[256],"over":[257],"state-of-the-art":[259],"methods.":[260],"Code":[261],"data":[263],"available":[265],"at":[266],"<uri":[267],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">anonymous.4open.science/r/Rationalization-PORAT-ECE9</uri>.":[269]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-12-01T00:00:00"}
