{"id":"https://openalex.org/W4406052131","doi":"https://doi.org/10.48550/arxiv.2501.00129","title":"A Data-Centric Approach to Detecting and Mitigating Demographic Bias in Pediatric Mental Health Text: A Case Study in Anxiety Detection","display_name":"A Data-Centric Approach to Detecting and Mitigating Demographic Bias in Pediatric Mental Health Text: A Case Study in Anxiety Detection","publication_year":2024,"publication_date":"2024-12-30","ids":{"openalex":"https://openalex.org/W4406052131","doi":"https://doi.org/10.48550/arxiv.2501.00129"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2501.00129","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.00129","pdf_url":"https://arxiv.org/pdf/2501.00129","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2501.00129","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021442709","display_name":"Julia Ive","orcid":"https://orcid.org/0000-0002-3931-3392"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ive, Julia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034410008","display_name":"Paulina Bondaronek","orcid":"https://orcid.org/0000-0003-0096-1234"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bondaronek, Paulina","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101517397","display_name":"Vishal Yadav","orcid":"https://orcid.org/0000-0003-1506-8991"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yadav, Vishal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017444979","display_name":"Daniel Santel","orcid":"https://orcid.org/0000-0002-6495-8328"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Santel, Daniel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002880520","display_name":"Tracy A. Glauser","orcid":"https://orcid.org/0000-0003-1520-2732"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Glauser, Tracy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068305321","display_name":"Tina L. Cheng","orcid":"https://orcid.org/0000-0002-2053-1402"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Tina","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010194987","display_name":"Jeffrey R. Strawn","orcid":"https://orcid.org/0000-0002-7526-2641"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Strawn, Jeffrey R.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066366608","display_name":"Greeshma Agasthya","orcid":"https://orcid.org/0000-0002-2301-5964"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Agasthya, Greeshma","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115920506","display_name":"Jordan Tschida","orcid":"https://orcid.org/0000-0002-1359-4165"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tschida, Jordan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034106271","display_name":"Sanghyun Choo","orcid":"https://orcid.org/0000-0002-8884-3437"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choo, Sanghyun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087960600","display_name":"Mayanka Chandrashekar","orcid":"https://orcid.org/0000-0002-3697-5972"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chandrashekar, Mayanka","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078132584","display_name":"Anuj Kapadia","orcid":"https://orcid.org/0000-0003-2755-4495"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kapadia, Anuj J.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5057902242","display_name":"John Pestian","orcid":"https://orcid.org/0000-0001-5998-249X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pestian, John","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5021442709"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10762","display_name":"Migration, Health and Trauma","score":0.8772000074386597,"subfield":{"id":"https://openalex.org/subfields/3203","display_name":"Clinical Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10762","display_name":"Migration, Health and Trauma","score":0.8772000074386597,"subfield":{"id":"https://openalex.org/subfields/3203","display_name":"Clinical Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13883","display_name":"Child and Adolescent Health","score":0.876800000667572,"subfield":{"id":"https://openalex.org/subfields/3600","display_name":"General Health Professions"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.7473999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/anxiety","display_name":"Anxiety","score":0.7309362888336182},{"id":"https://openalex.org/keywords/mental-health","display_name":"Mental health","score":0.6821005344390869},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.5279285907745361},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.39944693446159363},{"id":"https://openalex.org/keywords/clinical-psychology","display_name":"Clinical psychology","score":0.34885546565055847},{"id":"https://openalex.org/keywords/psychiatry","display_name":"Psychiatry","score":0.3101074993610382},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.2902265191078186}],"concepts":[{"id":"https://openalex.org/C558461103","wikidata":"https://www.wikidata.org/wiki/Q154430","display_name":"Anxiety","level":2,"score":0.7309362888336182},{"id":"https://openalex.org/C134362201","wikidata":"https://www.wikidata.org/wiki/Q317309","display_name":"Mental health","level":2,"score":0.6821005344390869},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.5279285907745361},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.39944693446159363},{"id":"https://openalex.org/C70410870","wikidata":"https://www.wikidata.org/wiki/Q199906","display_name":"Clinical psychology","level":1,"score":0.34885546565055847},{"id":"https://openalex.org/C118552586","wikidata":"https://www.wikidata.org/wiki/Q7867","display_name":"Psychiatry","level":1,"score":0.3101074993610382},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.2902265191078186}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2501.00129","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.00129","pdf_url":"https://arxiv.org/pdf/2501.00129","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2501.00129","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2501.00129","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2501.00129","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.00129","pdf_url":"https://arxiv.org/pdf/2501.00129","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1645119126","display_name":null,"funder_award_id":"AC05-00OR22725","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G1719536385","display_name":null,"funder_award_id":"DE-AC05-00OR22725","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G5726405315","display_name":null,"funder_award_id":"DE-AC05","funder_id":"https://openalex.org/F4320306250","funder_display_name":"Battelle"},{"id":"https://openalex.org/G6129992089","display_name":null,"funder_award_id":"DE-AC05-","funder_id":"https://openalex.org/F4320316892","funder_display_name":"UT-Battelle"},{"id":"https://openalex.org/G6864165199","display_name":null,"funder_award_id":"DE-AC05-00OR22725","funder_id":"https://openalex.org/F4320306250","funder_display_name":"Battelle"},{"id":"https://openalex.org/G7995982022","display_name":null,"funder_award_id":"DE-AC05","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G8813984943","display_name":null,"funder_award_id":"DE-AC05-00OR22725","funder_id":"https://openalex.org/F4320316892","funder_display_name":"UT-Battelle"},{"id":"https://openalex.org/G8906985441","display_name":null,"funder_award_id":"00OR22725","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G8943143067","display_name":null,"funder_award_id":"AC05-00OR22725","funder_id":"https://openalex.org/F4320316892","funder_display_name":"UT-Battelle"}],"funders":[{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320306250","display_name":"Battelle","ror":"https://ror.org/01h5tnr73"},{"id":"https://openalex.org/F4320309575","display_name":"Cincinnati Children's Hospital Medical Center","ror":"https://ror.org/01hcyya48"},{"id":"https://openalex.org/F4320316892","display_name":"UT-Battelle","ror":"https://ror.org/04nza6677"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4406052131.pdf","grobid_xml":"https://content.openalex.org/works/W4406052131.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2358430072","https://openalex.org/W1985838049","https://openalex.org/W3089724416","https://openalex.org/W2013157839","https://openalex.org/W2111463896","https://openalex.org/W1551113066","https://openalex.org/W4210836443","https://openalex.org/W1972101794","https://openalex.org/W3139055845","https://openalex.org/W2416006987"],"abstract_inverted_index":{"Introduction:":[0],"Healthcare":[1],"AI":[2,45,256],"models":[3,46,258],"often":[4],"inherit":[5],"biases":[6],"from":[7],"their":[8],"training":[9,42],"data.":[10,26,92],"While":[11],"efforts":[12],"have":[13],"primarily":[14],"targeted":[15],"bias":[16,64,75,206,254],"in":[17,40,50,136,171,177,214,255],"structured":[18],"data,":[19],"mental":[20,52,89],"health":[21,53,90],"heavily":[22],"depends":[23],"on":[24,116,129,185,242,260],"unstructured":[25],"This":[27,125],"study":[28],"aims":[29],"to":[30,37,48,59,73,83,164,169,209,227],"detect":[31],"and":[32,81,101,155,174,190,239],"mitigate":[33],"linguistic":[34,175,191],"differences":[35,39,176],"related":[36],"non-biological":[38],"the":[41,61],"data":[43],"of":[44,63,146],"designed":[47],"assist":[49],"pediatric":[51,137],"screening.":[54],"Our":[55,140],"objectives":[56],"are:":[57],"(1)":[58],"assess":[60],"presence":[62],"by":[65,207],"evaluating":[66],"outcome":[67],"parity":[68,97],"across":[69,98,217],"sex":[70],"subgroups,":[71],"(2)":[72],"identify":[74],"sources":[76],"through":[77],"textual":[78],"distribution":[79],"analysis,":[80],"(3)":[82],"develop":[84],"a":[85,130,143,151,156,223],"de-biasing":[86,111,202,225],"method":[87,112],"for":[88,132,181,252],"text":[91],"Methods:":[93],"We":[94,221],"examined":[95],"classification":[96],"demographic":[99,218],"groups":[100],"assessed":[102],"how":[103],"gendered":[104],"language":[105,238],"influences":[106],"model":[107,131],"predictions.":[108],"A":[109],"data-centric":[110,224],"was":[113,127],"applied,":[114],"focusing":[115],"neutralizing":[117,236],"biased":[118,237],"terms":[119],"while":[120],"retaining":[121],"salient":[122],"clinical":[123,233],"information.":[124],"methodology":[126],"tested":[128],"automatic":[133],"anxiety":[134],"detection":[135],"patients.":[138],"Results:":[139],"findings":[141],"revealed":[142],"systematic":[144],"under-diagnosis":[145],"female":[147],"adolescent":[148],"patients,":[149,166],"with":[150],"4%":[152],"lower":[153],"accuracy":[154],"9%":[157],"higher":[158],"False":[159],"Negative":[160],"Rate":[161],"(FNR)":[162],"compared":[163],"male":[165,182],"likely":[167],"due":[168],"disparities":[170,231],"information":[172],"density":[173],"patient":[178],"notes.":[179],"Notes":[180],"patients":[183],"were":[184],"average":[186],"500":[187],"words":[188],"longer,":[189],"similarity":[192],"metrics":[193],"indicated":[194],"distinct":[195],"word":[196],"distributions":[197],"between":[198],"genders.":[199],"Implementing":[200],"our":[201,246],"approach":[203,247],"reduced":[204],"diagnostic":[205],"up":[208],"27%,":[210],"demonstrating":[211],"its":[212],"effectiveness":[213],"enhancing":[215,240],"equity":[216],"groups.":[219],"Discussion:":[220],"developed":[222],"framework":[226],"address":[228],"gender-based":[229],"content":[230],"within":[232],"text.":[234,261],"By":[235],"focus":[241],"clinically":[243],"essential":[244],"information,":[245],"demonstrates":[248],"an":[249],"effective":[250],"strategy":[251],"mitigating":[253],"healthcare":[257],"trained":[259]},"counts_by_year":[],"updated_date":"2026-05-15T08:27:34.491423","created_date":"2025-01-04T00:00:00"}
