{"id":"https://openalex.org/W4386242314","doi":"https://doi.org/10.1145/3600211.3604657","title":"Fairness Implications of Encoding Protected Categorical Attributes","display_name":"Fairness Implications of Encoding Protected Categorical Attributes","publication_year":2023,"publication_date":"2023-08-08","ids":{"openalex":"https://openalex.org/W4386242314","doi":"https://doi.org/10.1145/3600211.3604657"},"language":"en","primary_location":{"id":"doi:10.1145/3600211.3604657","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3600211.3604657","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2023 AAAI/ACM Conference on AI, Ethics, and Society","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058755772","display_name":"Carlos Mougan","orcid":"https://orcid.org/0000-0002-3137-6890"},"institutions":[{"id":"https://openalex.org/I43439940","display_name":"University of Southampton","ror":"https://ror.org/01ryk1543","country_code":"GB","type":"education","lineage":["https://openalex.org/I43439940"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Carlos Mougan","raw_affiliation_strings":["Electronic and Computer Science, Univeristy of Southampton, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Electronic and Computer Science, Univeristy of Southampton, United Kingdom","institution_ids":["https://openalex.org/I43439940"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081978740","display_name":"Jos\u00e9 M. \u00c1lvarez","orcid":"https://orcid.org/0000-0001-9412-9013"},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]},{"id":"https://openalex.org/I157210198","display_name":"Scuola Normale Superiore","ror":"https://ror.org/03aydme10","country_code":"IT","type":"education","lineage":["https://openalex.org/I157210198"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Jose Manuel Alvarez","raw_affiliation_strings":["Computer Science, University of Pisa, Italy and Scuola Normale Superiore, Italy"],"affiliations":[{"raw_affiliation_string":"Computer Science, University of Pisa, Italy and Scuola Normale Superiore, Italy","institution_ids":["https://openalex.org/I157210198","https://openalex.org/I108290504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071524745","display_name":"Salvatore Ruggieri","orcid":"https://orcid.org/0000-0002-1917-6087"},"institutions":[{"id":"https://openalex.org/I108290504","display_name":"University of Pisa","ror":"https://ror.org/03ad39j10","country_code":"IT","type":"education","lineage":["https://openalex.org/I108290504"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Salvatore Ruggieri","raw_affiliation_strings":["Dipartimento di Informatica, Universit\u00e0 di Pisa, Italy"],"affiliations":[{"raw_affiliation_string":"Dipartimento di Informatica, Universit\u00e0 di Pisa, Italy","institution_ids":["https://openalex.org/I108290504"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062807811","display_name":"Steffen Staab","orcid":"https://orcid.org/0000-0002-0780-4154"},"institutions":[{"id":"https://openalex.org/I100066346","display_name":"University of Stuttgart","ror":"https://ror.org/04vnq7t77","country_code":"DE","type":"education","lineage":["https://openalex.org/I100066346"]},{"id":"https://openalex.org/I43439940","display_name":"University of Southampton","ror":"https://ror.org/01ryk1543","country_code":"GB","type":"education","lineage":["https://openalex.org/I43439940"]}],"countries":["DE","GB"],"is_corresponding":false,"raw_author_name":"Steffen Staab","raw_affiliation_strings":["Universit\u00e4t Stuttgart, Germany and Univeristy of Southampton, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Universit\u00e4t Stuttgart, Germany and Univeristy of Southampton, United Kingdom","institution_ids":["https://openalex.org/I43439940","https://openalex.org/I100066346"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5058755772"],"corresponding_institution_ids":["https://openalex.org/I43439940"],"apc_list":null,"apc_paid":null,"fwci":2.3031,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.90664869,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"454","last_page":"465"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.8958839774131775},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.7372956275939941},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6785827875137329},{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.6289514899253845},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.624895453453064},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.572413980960846},{"id":"https://openalex.org/keywords/cardinality","display_name":"Cardinality (data modeling)","score":0.4902346730232239},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.47508516907691956},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.23652055859565735}],"concepts":[{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.8958839774131775},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.7372956275939941},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6785827875137329},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.6289514899253845},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.624895453453064},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.572413980960846},{"id":"https://openalex.org/C87117476","wikidata":"https://www.wikidata.org/wiki/Q362383","display_name":"Cardinality (data modeling)","level":2,"score":0.4902346730232239},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.47508516907691956},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.23652055859565735}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3600211.3604657","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3600211.3604657","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2023 AAAI/ACM Conference on AI, Ethics, and Society","raw_type":"proceedings-article"},{"id":"pmh:oai:arpi.unipi.it:11568/1216550","is_oa":false,"landing_page_url":"https://hdl.handle.net/11568/1216550","pdf_url":null,"source":{"id":"https://openalex.org/S4377196265","display_name":"CINECA IRIS Institutial research information system (University of Pisa)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I108290504","host_organization_name":"University of Pisa","host_organization_lineage":["https://openalex.org/I108290504"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferenceObject"},{"id":"pmh:oai:ricerca.sns.it:11384/138704","is_oa":false,"landing_page_url":"https://hdl.handle.net/11384/138704","pdf_url":null,"source":{"id":"https://openalex.org/S7407050981","display_name":"Scuola Normale Superiore di Pisa","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.5699999928474426,"id":"https://metadata.un.org/sdg/16"},{"display_name":"Reduced inequalities","score":0.4300000071525574,"id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G1974542962","display_name":null,"funder_award_id":"Sk\u0142odowska","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G2689612763","display_name":null,"funder_award_id":"Marie","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G2786304416","display_name":null,"funder_award_id":"Marie Sk\u0142odowska-Curie Action","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G4956428346","display_name":null,"funder_award_id":"Horizon 2020 research and innovatio","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G6100177302","display_name":null,"funder_award_id":"Sk\u0142odowska","funder_id":"https://openalex.org/F4320338337","funder_display_name":"H2020 Marie Sk\u0142odowska-Curie Actions"},{"id":"https://openalex.org/G6814690871","display_name":null,"funder_award_id":"860630","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G7901872499","display_name":null,"funder_award_id":"Marie","funder_id":"https://openalex.org/F4320338337","funder_display_name":"H2020 Marie Sk\u0142odowska-Curie Actions"},{"id":"https://openalex.org/G7955706205","display_name":null,"funder_award_id":"Horizon 2020","funder_id":"https://openalex.org/F4320338337","funder_display_name":"H2020 Marie Sk\u0142odowska-Curie Actions"},{"id":"https://openalex.org/G8084396017","display_name":null,"funder_award_id":"860630","funder_id":"https://openalex.org/F4320338337","funder_display_name":"H2020 Marie Sk\u0142odowska-Curie Actions"},{"id":"https://openalex.org/G8318064016","display_name":null,"funder_award_id":"Horizon","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320334679","display_name":"Research Executive Agency","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320338337","display_name":"H2020 Marie Sk\u0142odowska-Curie Actions","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W1819662813","https://openalex.org/W1961345416","https://openalex.org/W1990836268","https://openalex.org/W1999380087","https://openalex.org/W2014352947","https://openalex.org/W2026019770","https://openalex.org/W2100960835","https://openalex.org/W2106100548","https://openalex.org/W2111959010","https://openalex.org/W2116984840","https://openalex.org/W2129018774","https://openalex.org/W2165960883","https://openalex.org/W2166454173","https://openalex.org/W2282821441","https://openalex.org/W2295598076","https://openalex.org/W2392403817","https://openalex.org/W2584805976","https://openalex.org/W2605800822","https://openalex.org/W2799900537","https://openalex.org/W2889357760","https://openalex.org/W2901823434","https://openalex.org/W2954052001","https://openalex.org/W2963104135","https://openalex.org/W2963105378","https://openalex.org/W2972785004","https://openalex.org/W2997591727","https://openalex.org/W3023702633","https://openalex.org/W3032340379","https://openalex.org/W3094948551","https://openalex.org/W3101427066","https://openalex.org/W3105965470","https://openalex.org/W3118480630","https://openalex.org/W3131567681","https://openalex.org/W3135468018","https://openalex.org/W3142848995","https://openalex.org/W3164035696","https://openalex.org/W3181414820","https://openalex.org/W3196884490","https://openalex.org/W3201969467","https://openalex.org/W4212904757","https://openalex.org/W4233413206","https://openalex.org/W4283164653","https://openalex.org/W4283166422","https://openalex.org/W4286910448","https://openalex.org/W4289258088","https://openalex.org/W4298304654","https://openalex.org/W4298401804","https://openalex.org/W4320853929","https://openalex.org/W4393268635","https://openalex.org/W6638208828"],"related_works":["https://openalex.org/W2125652721","https://openalex.org/W1540371141","https://openalex.org/W4231274751","https://openalex.org/W1549363203","https://openalex.org/W2154063878","https://openalex.org/W2556012038","https://openalex.org/W1489772951","https://openalex.org/W3114793362","https://openalex.org/W4229333355","https://openalex.org/W4390437797"],"abstract_inverted_index":{"Past":[0],"research":[1],"has":[2],"demonstrated":[3],"that":[4,49,116,169,180],"the":[5,77,91,97,142,150,159,175],"explicit":[6],"use":[7],"of":[8,33,96,113,177],"protected":[9,38],"attributes":[10,39,195],"in":[11,153],"machine":[12,21,56,78,184],"learning":[13,22,57,79,185],"can":[14,50],"improve":[15,188],"both":[16],"performance":[17,85,189],"and":[18,75,86,93,105,123,141,164],"fairness.":[19,87],"Many":[20],"algorithms,":[23],"however,":[24],"cannot":[25],"directly":[26],"process":[27],"categorical":[28,162,194],"attributes,":[29],"such":[30],"as":[31,47],"country":[32],"birth":[34],"or":[35,67],"ethnicity.":[36],"Because":[37],"frequently":[40],"are":[41],"categorical,":[42],"they":[43],"must":[44],"be":[45,51],"encoded":[46],"features":[48],"input":[52],"to":[53,126,136,149],"a":[54,197],"chosen":[55],"algorithm,":[58],"e.g.":[59],"support":[60],"vector":[61],"machines,":[62],"gradient":[63],"boosting":[64],"decision":[65],"trees":[66],"linear":[68],"models.":[69,128],"Thereby,":[70],"encoding":[71,101,104,121,166,192],"methods":[72,122,168],"influence":[73],"how":[74],"what":[76],"algorithm":[80],"will":[81],"learn,":[82],"affecting":[83],"model":[84],"This":[88],"work":[89],"compares":[90],"accuracy":[92],"fairness":[94],"implications":[95],"two":[98,111],"most":[99],"well-known":[100],"methods:":[102],"one-hot":[103],"target":[106,165],"encoding.":[107],"We":[108,157],"distinguish":[109],"between":[110,161],"types":[112],"induced":[114],"bias":[115],"may":[117,124,181],"arise":[118,182],"from":[119],"these":[120],"lead":[125],"unfair":[127],"The":[129],"first":[130],"type,":[131,144],"irreducible":[132],"bias,":[133,146],"is":[134,147],"due":[135,148],"direct":[137],"group":[138],"category":[139],"discrimination":[140],"second":[143],"reducible":[145],"large":[151],"variance":[152],"statistically":[154],"underrepresented":[155],"groups.":[156],"investigate":[158],"interaction":[160],"encodings":[163],"regularization":[167],"reduce":[170],"unfairness.":[171],"Furthermore,":[172],"we":[173],"consider":[174],"problem":[176],"intersectional":[178],"unfairness":[179],"when":[183],"best":[186],"practices":[187],"measures":[190],"by":[191],"several":[193],"into":[196],"high-cardinality":[198],"feature.":[199]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
