{"id":"https://openalex.org/W4411934347","doi":"https://doi.org/10.1162/tacl_a_00758","title":"Exploring Practical Gaps in Using Cross Entropy to Implement Maximum Mutual Information Criterion for Rationalization","display_name":"Exploring Practical Gaps in Using Cross Entropy to Implement Maximum Mutual Information Criterion for Rationalization","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4411934347","doi":"https://doi.org/10.1162/tacl_a_00758"},"language":"en","primary_location":{"id":"doi:10.1162/tacl_a_00758","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00758","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00758/2534936/tacl_a_00758.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00758/2534936/tacl_a_00758.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100672694","display_name":"Wei Liu","orcid":"https://orcid.org/0000-0002-3871-9454"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wei Liu","raw_affiliation_strings":["School of Computer Science and Technology, HUST, China. idc_lw@hust.edu.cn"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, HUST, China. idc_lw@hust.edu.cn","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067698200","display_name":"Zhiying Deng","orcid":"https://orcid.org/0000-0002-8557-2619"},"institutions":[{"id":"https://openalex.org/I40963666","display_name":"Central China Normal University","ror":"https://ror.org/03x1jna21","country_code":"CN","type":"education","lineage":["https://openalex.org/I40963666"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiying Deng","raw_affiliation_strings":["Faculty of Artificial Intelligence in Education, Central China Normal University, China. zhiyingdzy@gmail.com"],"affiliations":[{"raw_affiliation_string":"Faculty of Artificial Intelligence in Education, Central China Normal University, China. zhiyingdzy@gmail.com","institution_ids":["https://openalex.org/I40963666"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113430787","display_name":"Zhongyu Niu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhongyu Niu","raw_affiliation_strings":["School of Computer Science and Technology, HUST, China. zy_niu@hust.edu.cn"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, HUST, China. zy_niu@hust.edu.cn","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100384838","display_name":"Jun Wang","orcid":"https://orcid.org/0000-0002-9515-076X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jun Wang","raw_affiliation_strings":["iWudao Tech, China. jwang@iwudao.tech"],"affiliations":[{"raw_affiliation_string":"iWudao Tech, China. jwang@iwudao.tech","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027119797","display_name":"Haozhao Wang","orcid":"https://orcid.org/0000-0002-7591-5315"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haozhao Wang","raw_affiliation_strings":["School of Computer Science and Technology, HUST, China. hz_wang@hust.edu.cn"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, HUST, China. hz_wang@hust.edu.cn","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039670436","display_name":"Ruixuan Li","orcid":"https://orcid.org/0000-0002-7791-5511"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ruixuan Li","raw_affiliation_strings":["School of Computer Science and Technology, HUST, China. rxli@hust.edu.cn"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, HUST, China. rxli@hust.edu.cn","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100672694"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.2845,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.8961906,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"13","issue":null,"first_page":"577","last_page":"594"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9836000204086304,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9531000256538391,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mutual-information","display_name":"Mutual information","score":0.7784733772277832},{"id":"https://openalex.org/keywords/rationalization","display_name":"Rationalization (economics)","score":0.7751822471618652},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7314354777336121},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.5724903345108032},{"id":"https://openalex.org/keywords/management-science","display_name":"Management science","score":0.34853774309158325},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3313705325126648},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3275248408317566},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27294182777404785},{"id":"https://openalex.org/keywords/epistemology","display_name":"Epistemology","score":0.13706842064857483},{"id":"https://openalex.org/keywords/thermodynamics","display_name":"Thermodynamics","score":0.08476969599723816},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.06432998180389404}],"concepts":[{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.7784733772277832},{"id":"https://openalex.org/C52438962","wikidata":"https://www.wikidata.org/wiki/Q1555139","display_name":"Rationalization (economics)","level":2,"score":0.7751822471618652},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7314354777336121},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.5724903345108032},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.34853774309158325},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3313705325126648},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3275248408317566},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27294182777404785},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.13706842064857483},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.08476969599723816},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.06432998180389404},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1162/tacl_a_00758","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00758","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00758/2534936/tacl_a_00758.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1162/tacl_a_00758","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00758","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00758/2534936/tacl_a_00758.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1520791058","display_name":null,"funder_award_id":"62376103","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2878085913","display_name":null,"funder_award_id":"62206102","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4020255992","display_name":null,"funder_award_id":"Project","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4435229518","display_name":null,"funder_award_id":"62302184","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7174558747","display_name":null,"funder_award_id":"Group","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7608752429","display_name":null,"funder_award_id":"Talent","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8683302537","display_name":null,"funder_award_id":"2024BAA008","funder_id":"https://openalex.org/F4320336744","funder_display_name":"Science and Technology Program of Hubei Province"},{"id":"https://openalex.org/G8955107213","display_name":null,"funder_award_id":"Major","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320318398","display_name":"Ant Group","ror":null},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321883","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320336744","display_name":"Science and Technology Program of Hubei Province","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4411934347.pdf","grobid_xml":"https://content.openalex.org/works/W4411934347.grobid-xml"},"referenced_works_count":54,"referenced_works":["https://openalex.org/W2001259128","https://openalex.org/W2160409620","https://openalex.org/W2282821441","https://openalex.org/W2945976633","https://openalex.org/W2949227999","https://openalex.org/W2963233086","https://openalex.org/W2970155250","https://openalex.org/W2990138404","https://openalex.org/W3034917890","https://openalex.org/W3035064231","https://openalex.org/W3035503910","https://openalex.org/W3092083846","https://openalex.org/W3110300144","https://openalex.org/W3138819813","https://openalex.org/W3165967177","https://openalex.org/W3173436762","https://openalex.org/W3208024750","https://openalex.org/W3209901185","https://openalex.org/W4221146190","https://openalex.org/W4224950688","https://openalex.org/W4225881819","https://openalex.org/W4280546523","https://openalex.org/W4309634482","https://openalex.org/W4309674289","https://openalex.org/W4330337479","https://openalex.org/W4366999773","https://openalex.org/W4367692219","https://openalex.org/W4378711560","https://openalex.org/W4379468317","https://openalex.org/W4385570896","https://openalex.org/W4385571168","https://openalex.org/W4389520359","https://openalex.org/W4389523957","https://openalex.org/W4390833061","https://openalex.org/W6631190155","https://openalex.org/W6637162671","https://openalex.org/W6682208247","https://openalex.org/W6748458661","https://openalex.org/W6763711611","https://openalex.org/W6765807149","https://openalex.org/W6767284243","https://openalex.org/W6775269048","https://openalex.org/W6786048916","https://openalex.org/W6809646742","https://openalex.org/W6843285470","https://openalex.org/W6848998024","https://openalex.org/W6849497746","https://openalex.org/W6850627172","https://openalex.org/W6852855762","https://openalex.org/W6853999047","https://openalex.org/W6856385540","https://openalex.org/W6861315699","https://openalex.org/W6873370108","https://openalex.org/W6929545795"],"related_works":["https://openalex.org/W2036846997","https://openalex.org/W2112223184","https://openalex.org/W2347586617","https://openalex.org/W2161963661","https://openalex.org/W2125614474","https://openalex.org/W2295845123","https://openalex.org/W2358054814","https://openalex.org/W2090882960","https://openalex.org/W2889544313","https://openalex.org/W2165061339"],"abstract_inverted_index":{"Abstract":[0],"Rationalization":[1],"is":[2,222],"a":[3,14,25,29,44,130,145,169,191],"framework":[4],"that":[5,46,174],"aims":[6],"to":[7,67,78,118,127,137,160,179,190,199,211],"build":[8],"self-explanatory":[9],"NLP":[10],"models":[11],"by":[12,43,93],"extracting":[13],"subset":[15],"of":[16,19,36,71,91,102,110,155],"human-intelligible":[17,34],"pieces":[18],"their":[20],"inputting":[21],"texts.":[22],"It":[23],"involves":[24],"cooperative":[26],"game":[27],"where":[28],"selector":[30,77,125],"selects":[31],"the":[32,37,40,57,60,64,69,72,76,89,99,103,107,124,135,149,153,156,180,187,194],"most":[33],"parts":[35],"input":[38],"as":[39],"rationale,":[41],"followed":[42],"predictor":[45,136],"makes":[47],"predictions":[48,62],"based":[49],"on":[50],"these":[51,139],"selected":[52,73,181,195],"rationales.":[53],"Existing":[54],"literature":[55],"uses":[56],"cross-entropy":[58,150],"between":[59,148],"model\u2019s":[61],"and":[63,106,152],"ground-truth":[65],"labels":[66],"measure":[68],"informativeness":[70,101,154],"rationales,":[74],"guiding":[75],"choose":[79],"better":[80],"ones.":[81],"In":[82],"this":[83,122,165],"study,":[84],"we":[85,167],"first":[86],"theoretically":[87],"analyze":[88],"objective":[90,151],"rationalization":[92],"decomposing":[94],"it":[95],"into":[96],"two":[97],"parts:":[98],"model-agnostic":[100],"rationale":[104,157,182,196,207],"candidates":[105],"predictor\u2019s":[108,188],"degree":[109],"fit.":[111],"We":[112],"then":[113],"provide":[114],"various":[115],"empirical":[116],"evidence":[117],"support":[119],"that,":[120],"under":[121],"framework,":[123],"tends":[126],"sample":[128],"from":[129,224],"limited":[131],"small":[132],"region,":[133],"causing":[134],"overfit":[138],"localized":[140],"areas.":[141],"This":[142,184],"results":[143],"in":[144],"significant":[146],"mismatch":[147],"candidates,":[158],"leading":[159],"suboptimal":[161],"solutions.":[162],"To":[163],"address":[164],"issue,":[166],"propose":[168],"simple":[170],"yet":[171],"effective":[172],"method":[173,204],"introduces":[175],"random":[176],"vicinal1":[177],"perturbations":[178],"candidates.":[183],"approach":[185],"broadens":[186],"assessment":[189],"vicinity":[192],"around":[193],"candidate.":[197],"Compared":[198],"recent":[200],"competitive":[201],"methods,":[202],"our":[203],"significantly":[205],"improves":[206],"quality":[208],"(by":[209],"up":[210],"6.6%)":[212],"across":[213],"six":[214],"widely":[215],"used":[216],"classification":[217],"datasets.":[218],"The":[219],"term":[220],"\u201cvicinal\u201d":[221,232],"borrowed":[223],"vicinal":[225],"risk":[226],"minimization":[227],"(Chapelle":[228],"et":[229],"al.,":[230],"2000);":[231],"means":[233],"neighboring":[234],"or":[235],"adjacent.":[236]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-15T08:11:43.952461","created_date":"2025-10-10T00:00:00"}
