{"id":"https://openalex.org/W4409749370","doi":"https://doi.org/10.1145/3706598.3713217","title":"Investigating the Capabilities and Limitations of Machine Learning for Identifying Bias in English Language Data with Information and Heritage Professionals","display_name":"Investigating the Capabilities and Limitations of Machine Learning for Identifying Bias in English Language Data with Information and Heritage Professionals","publication_year":2025,"publication_date":"2025-04-24","ids":{"openalex":"https://openalex.org/W4409749370","doi":"https://doi.org/10.1145/3706598.3713217"},"language":"en","primary_location":{"id":"doi:10.1145/3706598.3713217","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3706598.3713217","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2504.00860","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032893302","display_name":"Lucy Havens","orcid":"https://orcid.org/0000-0001-8158-6039"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Lucy Havens","raw_affiliation_strings":["University of Edinburgh, Edinburgh, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0001-8158-6039","affiliations":[{"raw_affiliation_string":"University of Edinburgh, Edinburgh, United Kingdom","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048194226","display_name":"Benjamin Bach","orcid":"https://orcid.org/0000-0002-9201-7744"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Benjamin Bach","raw_affiliation_strings":["Inria, Bordeaux, France and University of Edinburgh, Edinburgh, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0002-9201-7744","affiliations":[{"raw_affiliation_string":"Inria, Bordeaux, France and University of Edinburgh, Edinburgh, United Kingdom","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033582512","display_name":"Melissa Terras","orcid":"https://orcid.org/0000-0001-6496-3197"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Melissa Terras","raw_affiliation_strings":["University of Edinburgh, Edinburgh, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0001-6496-3197","affiliations":[{"raw_affiliation_string":"University of Edinburgh, Edinburgh, United Kingdom","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043179000","display_name":"Beatrice Alex","orcid":"https://orcid.org/0000-0002-7279-1476"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Beatrice Alex","raw_affiliation_strings":["University of Edinburgh, Edinburgh, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0002-7279-1476","affiliations":[{"raw_affiliation_string":"University of Edinburgh, Edinburgh, United Kingdom","institution_ids":["https://openalex.org/I98677209"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5032893302"],"corresponding_institution_ids":["https://openalex.org/I98677209"],"apc_list":null,"apc_paid":null,"fwci":2.057,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.8761622,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"22"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9824000000953674,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9824000000953674,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9764999747276306,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9545999765396118,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6798931360244751},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.45395416021347046},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.45111775398254395},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3700379729270935},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.3334578573703766}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6798931360244751},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.45395416021347046},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.45111775398254395},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3700379729270935},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.3334578573703766}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3706598.3713217","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3706598.3713217","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2504.00860","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.00860","pdf_url":"https://arxiv.org/pdf/2504.00860","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:HAL:hal-05117618v1","is_oa":true,"landing_page_url":"https://hal.science/hal-05117618","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"CHI 2025 - CHI Conference on Human Factors in Computing Systems, Apr 2025, Yokohama, Japan. pp.1-22, &#x27E8;10.1145/3706598.3713217&#x27E9;","raw_type":"Conference papers"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2504.00860","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.00860","pdf_url":"https://arxiv.org/pdf/2504.00860","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320314731","display_name":"UK Research and Innovation","ror":"https://ror.org/001aqnf71"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":121,"referenced_works":["https://openalex.org/W1119960297","https://openalex.org/W1527349555","https://openalex.org/W1563482706","https://openalex.org/W1761704792","https://openalex.org/W1971670344","https://openalex.org/W1991192911","https://openalex.org/W2005061283","https://openalex.org/W2007619812","https://openalex.org/W2034598596","https://openalex.org/W2038728174","https://openalex.org/W2067436631","https://openalex.org/W2067945973","https://openalex.org/W2071653415","https://openalex.org/W2126064827","https://openalex.org/W2128385741","https://openalex.org/W2143017621","https://openalex.org/W2146691185","https://openalex.org/W2150634379","https://openalex.org/W2180404376","https://openalex.org/W2337002970","https://openalex.org/W2467823181","https://openalex.org/W2483309689","https://openalex.org/W2493916176","https://openalex.org/W2603039744","https://openalex.org/W2738411409","https://openalex.org/W2740168486","https://openalex.org/W2788241675","https://openalex.org/W2898731212","https://openalex.org/W2899136066","https://openalex.org/W2920114910","https://openalex.org/W2942160782","https://openalex.org/W2945776595","https://openalex.org/W2950888501","https://openalex.org/W2963526187","https://openalex.org/W2982521860","https://openalex.org/W2999765337","https://openalex.org/W3000952406","https://openalex.org/W3004505508","https://openalex.org/W3020325112","https://openalex.org/W3034515982","https://openalex.org/W3037831233","https://openalex.org/W3044199925","https://openalex.org/W3044663232","https://openalex.org/W3047579825","https://openalex.org/W3097185012","https://openalex.org/W3098998028","https://openalex.org/W3102708241","https://openalex.org/W3104617516","https://openalex.org/W3104847483","https://openalex.org/W3117072286","https://openalex.org/W3119746452","https://openalex.org/W3123374861","https://openalex.org/W3135367826","https://openalex.org/W3135514117","https://openalex.org/W3146083582","https://openalex.org/W3166727371","https://openalex.org/W3168771811","https://openalex.org/W3173721282","https://openalex.org/W3174220540","https://openalex.org/W3177189402","https://openalex.org/W3181414820","https://openalex.org/W3188554804","https://openalex.org/W3196053885","https://openalex.org/W3196064594","https://openalex.org/W3197587259","https://openalex.org/W3198864673","https://openalex.org/W3207608052","https://openalex.org/W3212464620","https://openalex.org/W4210736086","https://openalex.org/W4210764005","https://openalex.org/W4210870651","https://openalex.org/W4213145388","https://openalex.org/W4214943962","https://openalex.org/W4220752914","https://openalex.org/W4224251572","https://openalex.org/W4226145682","https://openalex.org/W4235852123","https://openalex.org/W4239649351","https://openalex.org/W4240458495","https://openalex.org/W4242918116","https://openalex.org/W4244021162","https://openalex.org/W4248308225","https://openalex.org/W4249335113","https://openalex.org/W4253834041","https://openalex.org/W4254765313","https://openalex.org/W4255778550","https://openalex.org/W4256652306","https://openalex.org/W4256667956","https://openalex.org/W4281914077","https://openalex.org/W4285288507","https://openalex.org/W4285388465","https://openalex.org/W4285436127","https://openalex.org/W4287855119","https://openalex.org/W4287887504","https://openalex.org/W4287890642","https://openalex.org/W4288083800","https://openalex.org/W4288359825","https://openalex.org/W4301416904","https://openalex.org/W4307062131","https://openalex.org/W4321276891","https://openalex.org/W4323051415","https://openalex.org/W4365388135","https://openalex.org/W4366390744","https://openalex.org/W4366550901","https://openalex.org/W4376167053","https://openalex.org/W4380365974","https://openalex.org/W4383175668","https://openalex.org/W4385573886","https://openalex.org/W4385973770","https://openalex.org/W4386566641","https://openalex.org/W4386566763","https://openalex.org/W4388229648","https://openalex.org/W4392214583","https://openalex.org/W4392910123","https://openalex.org/W4396811641","https://openalex.org/W4396832613","https://openalex.org/W4401947350","https://openalex.org/W4403315440","https://openalex.org/W4403434698","https://openalex.org/W4404783416","https://openalex.org/W4410301798"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Despite":[0],"numerous":[1],"efforts":[2],"to":[3,10,50,56,63,96,105,122,126,134],"mitigate":[4],"their":[5],"biases,":[6],"ML":[7,16,45,91,124,147],"systems":[8],"continue":[9],"harm":[11],"already-marginalized":[12],"people.":[13],"While":[14],"predominant":[15],"approaches":[17,104,125],"assume":[18],"bias":[19,46,94,127,140],"can":[20,26,108],"be":[21,27],"removed":[22],"and":[23,82,111,115,128],"fair":[24],"models":[25,49,73],"created,":[28],"we":[29,70],"show":[30],"that":[31],"these":[32],"are":[33],"not":[34],"always":[35],"possible,":[36],"nor":[37],"desirable,":[38],"goals.":[39],"We":[40,118],"reframe":[41],"the":[42,72,88,100,120,136],"problem":[43],"of":[44,80,90,138],"by":[47],"creating":[48],"identify":[51],"biased":[52],"language,":[53],"drawing":[54],"attention":[55],"a":[57,68,75,131,145],"dataset's":[58],"biases":[59],"rather":[60],"than":[61],"trying":[62],"remove":[64],"them.":[65],"Then,":[66],"through":[67],"workshop,":[69],"evaluated":[71],"for":[74,92],"specific":[76],"use":[77,148],"case:":[78],"workflows":[79],"information":[81],"heritage":[83],"professionals.":[84],"Our":[85],"findings":[86],"demonstrate":[87,119],"limitations":[89],"identifying":[93],"due":[95],"its":[97,116],"contextual":[98],"nature,":[99],"way":[101],"in":[102,144],"which":[103],"mitigating":[106],"it":[107],"simultaneously":[109],"privilege":[110],"oppress":[112],"different":[113],"communities,":[114],"inevitability.":[117],"need":[121],"expand":[123],"fairness,":[129],"providing":[130],"mixed-methods":[132],"approach":[133],"investigating":[135],"feasibility":[137],"removing":[139],"or":[141],"achieving":[142],"fairness":[143],"given":[146],"case.":[149]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2025-10-10T00:00:00"}
