{"id":"https://openalex.org/W4400373649","doi":"https://doi.org/10.1145/3686924","title":"NLPGuard: A Framework for Mitigating the Use of Protected Attributes by NLP Classifiers","display_name":"NLPGuard: A Framework for Mitigating the Use of Protected Attributes by NLP Classifiers","publication_year":2024,"publication_date":"2024-11-07","ids":{"openalex":"https://openalex.org/W4400373649","doi":"https://doi.org/10.1145/3686924"},"language":"en","primary_location":{"id":"doi:10.1145/3686924","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3686924","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3686924","source":{"id":"https://openalex.org/S4210183893","display_name":"Proceedings of the ACM on Human-Computer Interaction","issn_l":"2573-0142","issn":["2573-0142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Human-Computer Interaction","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3686924","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061608915","display_name":"Salvatore Greco","orcid":"https://orcid.org/0000-0001-7239-9602"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Polytechnic University of Turin","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Salvatore Greco","raw_affiliation_strings":["Politecnico di Torino, Turin, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Torino, Turin, Italy","institution_ids":["https://openalex.org/I177477856"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077592758","display_name":"Ke Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I4210098141","display_name":"Nokia (United Kingdom)","ror":"https://ror.org/00zpf0626","country_code":"GB","type":"company","lineage":["https://openalex.org/I2738502077","https://openalex.org/I4210098141"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ke Zhou","raw_affiliation_strings":["Nokia Bell Labs, Cambridge, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Nokia Bell Labs, Cambridge, United Kingdom","institution_ids":["https://openalex.org/I4210098141"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023892723","display_name":"Licia Capra","orcid":"https://orcid.org/0000-0003-1425-3837"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Licia Capra","raw_affiliation_strings":["University College London, London, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University College London, London, United Kingdom","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053742461","display_name":"Tania Cerquitelli","orcid":"https://orcid.org/0000-0002-9039-6226"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Polytechnic University of Turin","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Tania Cerquitelli","raw_affiliation_strings":["Politecnico di Torino, Turin, Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Torino, Turin, Italy","institution_ids":["https://openalex.org/I177477856"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081008532","display_name":"Daniele Quercia","orcid":"https://orcid.org/0000-0001-9461-5804"},"institutions":[{"id":"https://openalex.org/I4210098141","display_name":"Nokia (United Kingdom)","ror":"https://ror.org/00zpf0626","country_code":"GB","type":"company","lineage":["https://openalex.org/I2738502077","https://openalex.org/I4210098141"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Daniele Quercia","raw_affiliation_strings":["Nokia Bell Labs, Cambridge, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Nokia Bell Labs, Cambridge, United Kingdom","institution_ids":["https://openalex.org/I4210098141"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5061608915"],"corresponding_institution_ids":["https://openalex.org/I177477856"],"apc_list":null,"apc_paid":null,"fwci":1.772,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.86798841,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"8","issue":"CSCW2","first_page":"1","last_page":"25"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9642000198364258,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9642000198364258,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9423999786376953,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7868954539299011},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.7360140681266785},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7258390188217163},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6714493036270142},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.4613061547279358},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4546539783477783},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4492446780204773}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7868954539299011},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.7360140681266785},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7258390188217163},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6714493036270142},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.4613061547279358},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4546539783477783},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4492446780204773}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3686924","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3686924","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3686924","source":{"id":"https://openalex.org/S4210183893","display_name":"Proceedings of the ACM on Human-Computer Interaction","issn_l":"2573-0142","issn":["2573-0142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Human-Computer Interaction","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2407.01697","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.01697","pdf_url":"https://arxiv.org/pdf/2407.01697","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/3686924","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3686924","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3686924","source":{"id":"https://openalex.org/S4210183893","display_name":"Proceedings of the ACM on Human-Computer Interaction","issn_l":"2573-0142","issn":["2573-0142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM on Human-Computer Interaction","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/5","display_name":"Gender equality","score":0.4699999988079071},{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.4000000059604645}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4400373649.pdf"},"referenced_works_count":43,"referenced_works":["https://openalex.org/W618024573","https://openalex.org/W648207664","https://openalex.org/W2053154970","https://openalex.org/W2081580037","https://openalex.org/W2114269021","https://openalex.org/W2282821441","https://openalex.org/W2493343568","https://openalex.org/W2557671501","https://openalex.org/W2618851150","https://openalex.org/W2791170418","https://openalex.org/W2799040448","https://openalex.org/W2893425640","https://openalex.org/W2898694742","https://openalex.org/W2909212904","https://openalex.org/W2952328691","https://openalex.org/W2962772482","https://openalex.org/W2962858109","https://openalex.org/W2962990575","https://openalex.org/W2963381846","https://openalex.org/W2964178496","https://openalex.org/W2996517240","https://openalex.org/W3033733989","https://openalex.org/W3034224415","https://openalex.org/W3035241006","https://openalex.org/W3094231174","https://openalex.org/W3101155149","https://openalex.org/W3117696238","https://openalex.org/W3134439870","https://openalex.org/W3134678353","https://openalex.org/W3176768410","https://openalex.org/W3181414820","https://openalex.org/W3190876505","https://openalex.org/W3202038256","https://openalex.org/W4205234189","https://openalex.org/W4214818205","https://openalex.org/W4220929609","https://openalex.org/W4221152344","https://openalex.org/W4283165820","https://openalex.org/W4287890982","https://openalex.org/W4289785153","https://openalex.org/W4380320058","https://openalex.org/W4385768144","https://openalex.org/W4404317831"],"related_works":["https://openalex.org/W4394984040","https://openalex.org/W2889302474","https://openalex.org/W2044488462","https://openalex.org/W2981877337","https://openalex.org/W3203938600","https://openalex.org/W2169074127","https://openalex.org/W2163707935","https://openalex.org/W83146503","https://openalex.org/W202723009","https://openalex.org/W4206462905"],"abstract_inverted_index":{"AI":[0],"regulations":[1],"are":[2],"expected":[3],"to":[4,62,124,150,169],"prohibit":[5],"machine":[6],"learning":[7],"models":[8],"from":[9],"using":[10],"sensitive":[11],"attributes":[12,55,87,117],"during":[13],"training.":[14],"However,":[15,161],"the":[16,33,64,83,153],"latest":[17],"Natural":[18],"Language":[19],"Processing":[20],"(NLP)":[21],"classifiers,":[22],"which":[23],"rely":[24],"on":[25,54,69,85,115,145],"deep":[26],"learning,":[27],"operate":[28],"as":[29,104],"black-box":[30],"systems,":[31],"complicating":[32],"detection":[34],"and":[35,100,133],"remediation":[36],"of":[37,67,152],"such":[38],"misuse.":[39],"Traditional":[40],"bias":[41],"mitigation":[42],"methods":[43],"in":[44,88],"NLP":[45,89,98,141],"aim":[46],"for":[47,81],"comparable":[48],"performance":[49],"across":[50],"different":[51],"groups":[52],"based":[53],"like":[56],"gender":[57],"or":[58],"race":[59],"but":[60],"fail":[61],"address":[63],"underlying":[65],"issue":[66],"reliance":[68,84,166],"protected":[70,86,116,146],"attributes.":[71,160],"To":[72],"partly":[73],"fix":[74],"that,":[75],"we":[76],"introduce":[77],"NLPGuard,":[78],"a":[79,107],"framework":[80],"mitigating":[82],"classifiers.":[90],"NLPGuard":[91,121,162],"takes":[92],"an":[93,96],"unlabeled":[94],"dataset,":[95],"existing":[97],"classifier,":[99],"its":[101],"training":[102,109],"data":[103],"input,":[105],"producing":[106],"modified":[108],"dataset":[110],"that":[111,139],"significantly":[112],"reduces":[113,164],"dependence":[114],"without":[118],"compromising":[119],"accuracy.":[120,174],"is":[122],"applied":[123],"three":[125],"classification":[126],"tasks:":[127],"identifying":[128],"toxic":[129],"language,":[130],"sentiment":[131],"analysis,":[132],"occupation":[134],"classification.":[135],"Our":[136],"evaluation":[137],"shows":[138],"current":[140],"classifiers":[142],"heavily":[143],"depend":[144],"attributes,":[147],"with":[148,158],"up":[149,168],"23%":[151],"most":[154],"predictive":[155],"words":[156],"associated":[157],"these":[159],"effectively":[163],"this":[165],"by":[167],"79%,":[170],"while":[171],"slightly":[172],"improving":[173]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
