{"id":"https://openalex.org/W4318147609","doi":"https://doi.org/10.1109/bigdata55660.2022.10021078","title":"Identifying Imbalance Thresholds in Input Data to Achieve Desired Levels of Algorithmic Fairness","display_name":"Identifying Imbalance Thresholds in Input Data to Achieve Desired Levels of Algorithmic Fairness","publication_year":2022,"publication_date":"2022-12-17","ids":{"openalex":"https://openalex.org/W4318147609","doi":"https://doi.org/10.1109/bigdata55660.2022.10021078"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata55660.2022.10021078","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/bigdata55660.2022.10021078","pdf_url":null,"source":{"id":"https://openalex.org/S4363607709","display_name":"2022 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062299333","display_name":"Mariachiara Mecati","orcid":"https://orcid.org/0000-0002-0041-1809"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Politecnico di Torino","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Mariachiara Mecati","raw_affiliation_strings":["Politecnico di Torino,Torino,Italy","Politecnico di Torino, Torino, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Politecnico di Torino,Torino,Italy","institution_ids":["https://openalex.org/I177477856"]},{"raw_affiliation_string":"Politecnico di Torino, Torino, Italy","institution_ids":["https://openalex.org/I177477856"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088188170","display_name":"Andrea Adrignola","orcid":null},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Politecnico di Torino","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Andrea Adrignola","raw_affiliation_strings":["Politecnico di Torino,Torino,Italy","Politecnico di Torino, Torino, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Politecnico di Torino,Torino,Italy","institution_ids":["https://openalex.org/I177477856"]},{"raw_affiliation_string":"Politecnico di Torino, Torino, Italy","institution_ids":["https://openalex.org/I177477856"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047965231","display_name":"Antonio Vetr\u00f2","orcid":"https://orcid.org/0000-0003-2027-3308"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Politecnico di Torino","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Antonio Vetro","raw_affiliation_strings":["Politecnico di Torino,Torino,Italy","Politecnico di Torino, Torino, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Politecnico di Torino,Torino,Italy","institution_ids":["https://openalex.org/I177477856"]},{"raw_affiliation_string":"Politecnico di Torino, Torino, Italy","institution_ids":["https://openalex.org/I177477856"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015536188","display_name":"Marco Torchiano","orcid":"https://orcid.org/0000-0001-5328-368X"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Politecnico di Torino","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marco Torchiano","raw_affiliation_strings":["Politecnico di Torino,Torino,Italy","Politecnico di Torino, Torino, Italy"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Politecnico di Torino,Torino,Italy","institution_ids":["https://openalex.org/I177477856"]},{"raw_affiliation_string":"Politecnico di Torino, Torino, Italy","institution_ids":["https://openalex.org/I177477856"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.20312748,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"12","issue":null,"first_page":"4700","last_page":"4709"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9812999963760376,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9812999963760376,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.977400004863739,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9764000177383423,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7379368543624878},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.6421375274658203},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.5766441822052002},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5491837859153748},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.5131000280380249},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.500417947769165},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.49665671586990356},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4269470274448395},{"id":"https://openalex.org/keywords/risk-analysis","display_name":"Risk analysis (engineering)","score":0.42236363887786865},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33658313751220703},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08913809061050415}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7379368543624878},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.6421375274658203},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.5766441822052002},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5491837859153748},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.5131000280380249},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.500417947769165},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.49665671586990356},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4269470274448395},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.42236363887786865},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33658313751220703},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08913809061050415},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata55660.2022.10021078","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/bigdata55660.2022.10021078","pdf_url":null,"source":{"id":"https://openalex.org/S4363607709","display_name":"2022 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.5400000214576721},{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.41999998688697815}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2006447892","https://openalex.org/W2338318698","https://openalex.org/W2764072425","https://openalex.org/W2992899357","https://openalex.org/W3038247645","https://openalex.org/W3042675867","https://openalex.org/W3099562911","https://openalex.org/W3196834332","https://openalex.org/W3202934978","https://openalex.org/W4205283541","https://openalex.org/W4226094784","https://openalex.org/W4288617757","https://openalex.org/W4289878260","https://openalex.org/W6780221099","https://openalex.org/W6802019065"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W4224009465","https://openalex.org/W4286629047","https://openalex.org/W4306321456","https://openalex.org/W4285260836","https://openalex.org/W3046775127","https://openalex.org/W3170094116","https://openalex.org/W4205958290","https://openalex.org/W2808699638"],"abstract_inverted_index":{"Software":[0],"bias":[1],"has":[2],"emerged":[3],"as":[4,59,77],"a":[5,22,60,69,90,139],"relevant":[6],"issue":[7],"in":[8,12,21,34,57],"the":[9,15,37,47,87,112,117,130,153,156],"latest":[10],"years,":[11],"conjunction":[13],"with":[14,96],"increasing":[16],"adoption":[17],"of":[18,24,29,39,46,81,93,105,119,155],"software":[19,40,64,143],"automation":[20],"variety":[23],"organizational":[25],"and":[26,32,100,162,171],"production":[27],"processes":[28],"our":[30],"society,":[31],"especially":[33],"decision-making.":[35],"Among":[36],"causes":[38],"bias,":[41],"data":[42,94],"imbalance":[43,56],"is":[44,160],"one":[45],"most":[48],"significant":[49],"issues.":[50],"In":[51,122],"this":[52],"paper,":[53],"we":[54,67],"treat":[55],"datasets":[58],"risk":[61,79,118],"factor":[62],"for":[63,74],"bias.":[65],"Specifically,":[66],"define":[68],"methodology":[70,88,159],"to":[71,89,128,138,150,167],"identify":[72,116],"thresholds":[73,113],"balance":[75],"measures":[76],"meaningful":[78],"indicators":[80],"unfair":[82,120],"classification":[83,98],"output.":[84,121],"We":[85],"apply":[86],"large":[91],"number":[92],"mutations":[95],"different":[97,168],"tasks":[99],"tested":[101],"all":[102],"possible":[103],"combinations":[104],"balance-unfairness-algorithm.The":[106],"results":[107],"show":[108],"that":[109],"on":[110],"average":[111],"can":[114,164],"accurately":[115],"certain":[123],"cases":[124],"they":[125],"even":[126],"tend":[127],"overestimate":[129],"risk:":[131],"although":[132],"such":[133],"behavior":[134],"could":[135],"be":[136,148,165],"instrumental":[137],"prudential":[140],"approach":[141],"towards":[142],"discrimination,":[144],"further":[145],"work":[146],"will":[147],"devoted":[149],"better":[151],"assess":[152],"reliability":[154],"thresholds.The":[157],"proposed":[158],"generic":[161],"it":[163],"applied":[166],"datasets,":[169],"algorithms,":[170],"context-specific":[172],"thresholds.":[173]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
