{"id":"https://openalex.org/W7089321813","doi":"https://doi.org/10.1007/978-3-032-08330-2_7","title":"Mitigating Text Toxicity with\u00a0Counterfactual Generation","display_name":"Mitigating Text Toxicity with\u00a0Counterfactual Generation","publication_year":2025,"publication_date":"2025-10-13","ids":{"openalex":"https://openalex.org/W7089321813","doi":"https://doi.org/10.1007/978-3-032-08330-2_7"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-032-08330-2_7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-032-08330-2_7","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-032-08330-2_7.pdf","source":{"id":"https://openalex.org/S2764900261","display_name":"Communications in computer and information science","issn_l":"1865-0929","issn":["1865-0929","1865-0937"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Computer and Information Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/978-3-032-08330-2_7.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Milan Bhan","orcid":null},"institutions":[{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]},{"id":"https://openalex.org/I51101395","display_name":"Universit\u00e9 Paris 1 Panth\u00e9on-Sorbonne","ror":"https://ror.org/002t25c44","country_code":"FR","type":"education","lineage":["https://openalex.org/I51101395"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Milan Bhan","raw_affiliation_strings":["Ekimetrics, Paris, France","LFI, LIP6, Sorbonne Universit\u00e9, Paris, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ekimetrics, Paris, France","institution_ids":[]},{"raw_affiliation_string":"LFI, LIP6, Sorbonne Universit\u00e9, Paris, France","institution_ids":["https://openalex.org/I39804081","https://openalex.org/I51101395"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jean-Noel Vittaut","orcid":null},"institutions":[{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]},{"id":"https://openalex.org/I51101395","display_name":"Universit\u00e9 Paris 1 Panth\u00e9on-Sorbonne","ror":"https://ror.org/002t25c44","country_code":"FR","type":"education","lineage":["https://openalex.org/I51101395"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jean-Noel Vittaut","raw_affiliation_strings":["LFI, LIP6, Sorbonne Universit\u00e9, Paris, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LFI, LIP6, Sorbonne Universit\u00e9, Paris, France","institution_ids":["https://openalex.org/I39804081","https://openalex.org/I51101395"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Nina Achache","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nina Achache","raw_affiliation_strings":["Ekimetrics, Paris, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ekimetrics, Paris, France","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Victor Legrand","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Victor Legrand","raw_affiliation_strings":["Ekimetrics, Paris, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ekimetrics, Paris, France","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Annabelle Blangero","orcid":null},"institutions":[{"id":"https://openalex.org/I21491767","display_name":"Aix-Marseille Universit\u00e9","ror":"https://ror.org/035xkbk20","country_code":"FR","type":"education","lineage":["https://openalex.org/I21491767"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Annabelle Blangero","raw_affiliation_strings":["Aix-Marseille Universit\u00e9, Aix-Marseille, France","Ekimetrics, Paris, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Aix-Marseille Universit\u00e9, Aix-Marseille, France","institution_ids":["https://openalex.org/I21491767"]},{"raw_affiliation_string":"Ekimetrics, Paris, France","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Nicolas Chesneau","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nicolas Chesneau","raw_affiliation_strings":["Ekimetrics, Paris, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ekimetrics, Paris, France","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Juliette Murris","orcid":null},"institutions":[{"id":"https://openalex.org/I204730241","display_name":"Universit\u00e9 Paris Cit\u00e9","ror":"https://ror.org/05f82e368","country_code":"FR","type":"education","lineage":["https://openalex.org/I204730241"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Juliette Murris","raw_affiliation_strings":["Universit\u00e9 Paris Cit\u00e9, Paris, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universit\u00e9 Paris Cit\u00e9, Paris, France","institution_ids":["https://openalex.org/I204730241"]}]},{"author_position":"last","author":{"id":null,"display_name":"Marie-Jeanne Lesot","orcid":null},"institutions":[{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]},{"id":"https://openalex.org/I51101395","display_name":"Universit\u00e9 Paris 1 Panth\u00e9on-Sorbonne","ror":"https://ror.org/002t25c44","country_code":"FR","type":"education","lineage":["https://openalex.org/I51101395"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Marie-Jeanne Lesot","raw_affiliation_strings":["LFI, LIP6, Sorbonne Universit\u00e9, Paris, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"LFI, LIP6, Sorbonne Universit\u00e9, Paris, France","institution_ids":["https://openalex.org/I39804081","https://openalex.org/I51101395"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I39804081","https://openalex.org/I51101395"],"apc_list":null,"apc_paid":null,"fwci":3.3248,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.94383816,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"135","last_page":"157"},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.718500018119812,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.718500018119812,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.0649000033736229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.05119999870657921,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/counterfactual-thinking","display_name":"Counterfactual thinking","score":0.9646000266075134},{"id":"https://openalex.org/keywords/offensive","display_name":"Offensive","score":0.5527999997138977},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5198000073432922},{"id":"https://openalex.org/keywords/detoxification","display_name":"Detoxification (alternative medicine)","score":0.44449999928474426},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4169999957084656},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.38119998574256897}],"concepts":[{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.9646000266075134},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7300000190734863},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5942000150680542},{"id":"https://openalex.org/C176856949","wikidata":"https://www.wikidata.org/wiki/Q2001676","display_name":"Offensive","level":2,"score":0.5527999997138977},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5198000073432922},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4828000068664551},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4471000134944916},{"id":"https://openalex.org/C2780497538","wikidata":"https://www.wikidata.org/wiki/Q1192006","display_name":"Detoxification (alternative medicine)","level":3,"score":0.44449999928474426},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4169999957084656},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.38119998574256897},{"id":"https://openalex.org/C2985684807","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Text generation","level":2,"score":0.3603000044822693},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.35199999809265137},{"id":"https://openalex.org/C2776187449","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Natural language generation","level":3,"score":0.32739999890327454},{"id":"https://openalex.org/C2780876879","wikidata":"https://www.wikidata.org/wiki/Q3054749","display_name":"Meaning (existential)","level":2,"score":0.2856999933719635},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2578999996185303}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/978-3-032-08330-2_7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-032-08330-2_7","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-032-08330-2_7.pdf","source":{"id":"https://openalex.org/S2764900261","display_name":"Communications in computer and information science","issn_l":"1865-0929","issn":["1865-0929","1865-0937"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Computer and Information Science","raw_type":"book-chapter"},{"id":"pmh:oai:HAL:hal-05478259v1","is_oa":false,"landing_page_url":"https://hal.science/hal-05478259","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"3rd World Conference on Explainable Artificial Intelligence (xAI 2025), Jul 2025, Istanbul, Turkey. pp.135-157, &#x27E8;10.1007/978-3-032-08330-2_7&#x27E9;","raw_type":"Conference papers"}],"best_oa_location":{"id":"doi:10.1007/978-3-032-08330-2_7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-032-08330-2_7","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-032-08330-2_7.pdf","source":{"id":"https://openalex.org/S2764900261","display_name":"Communications in computer and information science","issn_l":"1865-0929","issn":["1865-0929","1865-0937"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Computer and Information Science","raw_type":"book-chapter"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.794166088104248,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7089321813.pdf","grobid_xml":"https://content.openalex.org/works/W7089321813.grobid-xml"},"referenced_works_count":38,"referenced_works":["https://openalex.org/W2058373514","https://openalex.org/W2101105183","https://openalex.org/W2250539671","https://openalex.org/W2810732061","https://openalex.org/W2887782043","https://openalex.org/W2962937198","https://openalex.org/W2963095307","https://openalex.org/W2964449086","https://openalex.org/W2970641574","https://openalex.org/W2981731882","https://openalex.org/W3034999214","https://openalex.org/W3102641573","https://openalex.org/W3118208174","https://openalex.org/W3125759795","https://openalex.org/W3133702157","https://openalex.org/W3142348814","https://openalex.org/W3153611199","https://openalex.org/W3173813266","https://openalex.org/W3197945602","https://openalex.org/W3208191520","https://openalex.org/W3212327893","https://openalex.org/W4205923021","https://openalex.org/W4206112645","https://openalex.org/W4206299995","https://openalex.org/W4224275454","https://openalex.org/W4225150645","https://openalex.org/W4283274728","https://openalex.org/W4283318425","https://openalex.org/W4366262984","https://openalex.org/W4385566954","https://openalex.org/W4385572663","https://openalex.org/W4385734234","https://openalex.org/W4386242338","https://openalex.org/W4386804066","https://openalex.org/W4386834659","https://openalex.org/W4387818804","https://openalex.org/W4389520058","https://openalex.org/W4390712116"],"related_works":[],"abstract_inverted_index":{"Abstract":[0],"Toxicity":[1],"mitigation":[2],"consists":[3],"in":[4,7,137],"rephrasing":[5],"text":[6,37,79,107,153],"order":[8],"to":[9,25,35,53,59,77,94,119,134,145],"remove":[10],"offensive":[11],"or":[12],"harmful":[13],"meaning.":[14],"Neural":[15],"natural":[16],"language":[17],"processing":[18],"(NLP)":[19],"models":[20],"have":[21],"been":[22],"widely":[23],"used":[24],"target":[26,61],"and":[27,62,89,101,115,123,152,155],"mitigate":[28,63],"textual":[29,64],"toxicity.":[30,65],"However,":[31],"existing":[32],"methods":[33,58,93],"fail":[34],"detoxify":[36],"while":[38],"preserving":[39],"the":[40,45,143,147,157],"initial":[41],"non-toxic":[42,102],"meaning":[43],"at":[44],"same":[46],"time.":[47],"In":[48],"this":[49],"work,":[50],"we":[51],"propose":[52,67],"apply":[54],"eXplainable":[55],"AI":[56],"(XAI)":[57],"both":[60],"We":[66,104],"$$_{\\text":[68],"{tigtec}}$$":[69],"<mml:math":[70],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\">":[71],"<mml:msub>":[72],"<mml:mrow/>":[73],"<mml:mi>tigtec</mml:mi>":[74],"</mml:msub>":[75],"</mml:math>":[76],"perform":[78],"detoxification":[80,108,154],"by":[81],"applying":[82],"local":[83],"feature":[84,91],"importance,":[85],"counterfactual":[86,90,110,131,150],"example":[87],"generation":[88,111,151],"importance":[92],"a":[95],"toxicity":[96,138],"classifier":[97],"distinguishing":[98],"between":[99,149],"toxic":[100],"texts.":[103],"carry":[105],"out":[106],"through":[109],"on":[112],"three":[113,120],"datasets":[114],"compare":[116],"our":[117],"approach":[118],"competitors.":[121],"Automatic":[122],"human":[124],"evaluations":[125],"show":[126],"that":[127],"recently":[128],"developed":[129],"NLP":[130],"generators":[132],"lead":[133],"competitive":[135],"results":[136],"mitigation.":[139],"This":[140],"work":[141],"is":[142],"first":[144],"bridge":[146],"gap":[148],"paves":[156],"way":[158],"towards":[159],"more":[160],"practical":[161],"applications":[162],"of":[163],"XAI":[164],"methods.":[165]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-13T06:13:01.061226","created_date":"2025-10-13T00:00:00"}
