{"id":"https://openalex.org/W4403487557","doi":"https://doi.org/10.3233/faia240752","title":"Adversarial Attack for Explanation Robustness of Rationalization Models","display_name":"Adversarial Attack for Explanation Robustness of Rationalization Models","publication_year":2024,"publication_date":"2024-10-16","ids":{"openalex":"https://openalex.org/W4403487557","doi":"https://doi.org/10.3233/faia240752"},"language":"en","primary_location":{"id":"doi:10.3233/faia240752","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia240752","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.3233/faia240752","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053822540","display_name":"Yuankai Zhang","orcid":"https://orcid.org/0000-0002-2318-7539"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuankai Zhang","raw_affiliation_strings":["School of Computer Science and Technology, Huazhong University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Huazhong University of Science and Technology, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111266379","display_name":"Lingxiao Kong","orcid":null},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lingxiao Kong","raw_affiliation_strings":["School of Computer Science and Technology, Huazhong University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Huazhong University of Science and Technology, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027119797","display_name":"Haozhao Wang","orcid":"https://orcid.org/0000-0002-7591-5315"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haozhao Wang","raw_affiliation_strings":["School of Computer Science and Technology, Huazhong University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Huazhong University of Science and Technology, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039670436","display_name":"Ruixuan Li","orcid":"https://orcid.org/0000-0002-7791-5511"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruixuan Li","raw_affiliation_strings":["School of Computer Science and Technology, Huazhong University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Huazhong University of Science and Technology, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101781466","display_name":"Jun Wang","orcid":"https://orcid.org/0000-0002-8926-156X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jun Wang","raw_affiliation_strings":["iWudao Tech"],"affiliations":[{"raw_affiliation_string":"iWudao Tech","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100432144","display_name":"Yuhua Li","orcid":"https://orcid.org/0000-0003-2913-4478"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuhua Li","raw_affiliation_strings":["School of Computer Science and Technology, Huazhong University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Huazhong University of Science and Technology, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102744395","display_name":"Wei Liu","orcid":"https://orcid.org/0009-0001-6664-2888"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Liu","raw_affiliation_strings":["School of Computer Science and Technology, Huazhong University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Huazhong University of Science and Technology, China","institution_ids":["https://openalex.org/I47720641"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5053822540"],"corresponding_institution_ids":["https://openalex.org/I47720641"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.38593339,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9376000165939331,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.7653859853744507},{"id":"https://openalex.org/keywords/rationalization","display_name":"Rationalization (economics)","score":0.7305202484130859},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5607852339744568},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5087171196937561},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.37628355622291565},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2601197361946106},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.21130585670471191},{"id":"https://openalex.org/keywords/microeconomics","display_name":"Microeconomics","score":0.1164618730545044},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.08668527007102966},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.0573979914188385}],"concepts":[{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.7653859853744507},{"id":"https://openalex.org/C52438962","wikidata":"https://www.wikidata.org/wiki/Q1555139","display_name":"Rationalization (economics)","level":2,"score":0.7305202484130859},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5607852339744568},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5087171196937561},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.37628355622291565},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2601197361946106},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.21130585670471191},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.1164618730545044},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.08668527007102966},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0573979914188385},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/faia240752","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia240752","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.3233/faia240752","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia240752","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2502115930","https://openalex.org/W2980745308","https://openalex.org/W2380441323","https://openalex.org/W2482350142","https://openalex.org/W2006855656","https://openalex.org/W4246396837","https://openalex.org/W3126451824"],"abstract_inverted_index":{"Rationalization":[0],"models,":[1],"which":[2,73],"select":[3,137],"a":[4,21,148],"subset":[5],"of":[6,32,41,79,126,131,150,158],"input":[7,109],"text":[8],"as":[9,20],"rationale\u2014crucial":[10],"for":[11,152],"humans":[12],"to":[13,47,75,110,136],"understand":[14],"and":[15,102,115],"trust":[16],"predictions\u2014have":[17],"recently":[18],"emerged":[19],"prominent":[22],"research":[23],"area":[24],"in":[25,89,129,156],"eXplainable":[26],"Artificial":[27],"Intelligence":[28],"(XAI).":[29],"However,":[30],"most":[31],"previous":[33],"studies":[34],"mainly":[35],"focus":[36],"on":[37,100,120,144],"improving":[38,153],"the":[39,42,52,61,77,97,107,113,124],"quality":[40],"rationale,":[43],"ignoring":[44],"its":[45],"robustness":[46],"malicious":[48],"attack.":[49,117],"Specifically,":[50],"whether":[51],"rationalization":[53,80,127,154],"models":[54,81,91,128,155],"can":[55],"still":[56],"generate":[57],"high-quality":[58],"rationale":[59],"under":[60,141],"adversarial":[62],"attack":[63],"remains":[64],"unknown.":[65],"To":[66],"explore":[67],"this,":[68,145],"this":[69],"paper":[70],"proposes":[71],"UAT2E,":[72],"aims":[74],"undermine":[76],"explainability":[78],"without":[82],"altering":[83],"their":[84],"predictions,":[85],"thereby":[86],"eliciting":[87],"distrust":[88],"these":[90],"from":[92],"human":[93],"users.":[94],"UAT2E":[95],"employs":[96],"gradient-based":[98],"search":[99],"triggers":[101],"then":[103],"inserts":[104],"them":[105],"into":[106],"original":[108],"conduct":[111],"both":[112],"non-target":[114],"target":[116],"Experimental":[118],"results":[119],"five":[121],"datasets":[122],"reveal":[123],"vulnerability":[125],"terms":[130,157],"explanation,":[132],"where":[133],"they":[134],"tend":[135],"more":[138],"meaningless":[139],"tokens":[140],"attacks.":[142],"Based":[143],"we":[146],"make":[147],"series":[149],"recommendations":[151],"explanation.":[159]},"counts_by_year":[],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
