{"id":"https://openalex.org/W4403919365","doi":"https://doi.org/10.1109/ro-man60168.2024.10731257","title":"Fairness-Sensitive Policy-Gradient Reinforcement Learning for Reducing Bias in Robotic Assistance","display_name":"Fairness-Sensitive Policy-Gradient Reinforcement Learning for Reducing Bias in Robotic Assistance","publication_year":2024,"publication_date":"2024-08-26","ids":{"openalex":"https://openalex.org/W4403919365","doi":"https://doi.org/10.1109/ro-man60168.2024.10731257"},"language":"en","primary_location":{"id":"doi:10.1109/ro-man60168.2024.10731257","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ro-man60168.2024.10731257","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 33rd IEEE International Conference on Robot and Human Interactive Communication (ROMAN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100530911","display_name":"Jie Zhu","orcid":"https://orcid.org/0009-0004-9374-0098"},"institutions":[{"id":"https://openalex.org/I149910238","display_name":"Kent State University","ror":"https://ror.org/049pfb863","country_code":"US","type":"education","lineage":["https://openalex.org/I149910238"]},{"id":"https://openalex.org/I13805885","display_name":"Vaughn College of Aeronautics and Technology","ror":"https://ror.org/056e22e24","country_code":"US","type":"education","lineage":["https://openalex.org/I13805885"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jie Zhu","raw_affiliation_strings":["College of Aeronautics and Engineering, Kent State University,Cognitive Robotics and AI Lab (CRAI),Kent,OH,USA,44240"],"affiliations":[{"raw_affiliation_string":"College of Aeronautics and Engineering, Kent State University,Cognitive Robotics and AI Lab (CRAI),Kent,OH,USA,44240","institution_ids":["https://openalex.org/I13805885","https://openalex.org/I149910238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111144556","display_name":"Mengsha Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I149910238","display_name":"Kent State University","ror":"https://ror.org/049pfb863","country_code":"US","type":"education","lineage":["https://openalex.org/I149910238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mengsha Hu","raw_affiliation_strings":["Kent State University,Department of Computer Science"],"affiliations":[{"raw_affiliation_string":"Kent State University,Department of Computer Science","institution_ids":["https://openalex.org/I149910238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101754385","display_name":"Amy Zhang","orcid":"https://orcid.org/0000-0003-4301-9265"},"institutions":[{"id":"https://openalex.org/I13805885","display_name":"Vaughn College of Aeronautics and Technology","ror":"https://ror.org/056e22e24","country_code":"US","type":"education","lineage":["https://openalex.org/I13805885"]},{"id":"https://openalex.org/I149910238","display_name":"Kent State University","ror":"https://ror.org/049pfb863","country_code":"US","type":"education","lineage":["https://openalex.org/I149910238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Amy Zhang","raw_affiliation_strings":["College of Aeronautics and Engineering, Kent State University,Cognitive Robotics and AI Lab (CRAI),Kent,OH,USA,44240"],"affiliations":[{"raw_affiliation_string":"College of Aeronautics and Engineering, Kent State University,Cognitive Robotics and AI Lab (CRAI),Kent,OH,USA,44240","institution_ids":["https://openalex.org/I13805885","https://openalex.org/I149910238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103270436","display_name":"Ruoming Jin","orcid":"https://orcid.org/0000-0003-1895-4243"},"institutions":[{"id":"https://openalex.org/I149910238","display_name":"Kent State University","ror":"https://ror.org/049pfb863","country_code":"US","type":"education","lineage":["https://openalex.org/I149910238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ruoming Jin","raw_affiliation_strings":["Kent State University,Department of Computer Science"],"affiliations":[{"raw_affiliation_string":"Kent State University,Department of Computer Science","institution_ids":["https://openalex.org/I149910238"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100448453","display_name":"Rui Liu","orcid":"https://orcid.org/0000-0002-2842-3860"},"institutions":[{"id":"https://openalex.org/I13805885","display_name":"Vaughn College of Aeronautics and Technology","ror":"https://ror.org/056e22e24","country_code":"US","type":"education","lineage":["https://openalex.org/I13805885"]},{"id":"https://openalex.org/I149910238","display_name":"Kent State University","ror":"https://ror.org/049pfb863","country_code":"US","type":"education","lineage":["https://openalex.org/I149910238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rui Liu","raw_affiliation_strings":["College of Aeronautics and Engineering, Kent State University,Cognitive Robotics and AI Lab (CRAI),Kent,OH,USA,44240"],"affiliations":[{"raw_affiliation_string":"College of Aeronautics and Engineering, Kent State University,Cognitive Robotics and AI Lab (CRAI),Kent,OH,USA,44240","institution_ids":["https://openalex.org/I13805885","https://openalex.org/I149910238"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100530911"],"corresponding_institution_ids":["https://openalex.org/I13805885","https://openalex.org/I149910238"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.23215322,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"549","last_page":"554"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.9009000062942505,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.9009000062942505,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8338155746459961},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6290298700332642},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4662778377532959},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4643236994743347},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.13338863849639893},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.06530794501304626}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8338155746459961},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6290298700332642},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4662778377532959},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4643236994743347},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.13338863849639893},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.06530794501304626}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ro-man60168.2024.10731257","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ro-man60168.2024.10731257","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 33rd IEEE International Conference on Robot and Human Interactive Communication (ROMAN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W1977177161","https://openalex.org/W2029449366","https://openalex.org/W2057882064","https://openalex.org/W2095932468","https://openalex.org/W2100960835","https://openalex.org/W2116984840","https://openalex.org/W2158406371","https://openalex.org/W2295124130","https://openalex.org/W2530395818","https://openalex.org/W2736601468","https://openalex.org/W2753845591","https://openalex.org/W2760062370","https://openalex.org/W2909852956","https://openalex.org/W3092541244","https://openalex.org/W3118295647","https://openalex.org/W3120485916","https://openalex.org/W3134063474","https://openalex.org/W3135927599","https://openalex.org/W3138206886","https://openalex.org/W3177313640","https://openalex.org/W3181414820","https://openalex.org/W4230563027","https://openalex.org/W4287077603","https://openalex.org/W4288347276","https://openalex.org/W4312940830","https://openalex.org/W6728551298","https://openalex.org/W6741002519","https://openalex.org/W6744110554","https://openalex.org/W6746696776","https://openalex.org/W6748382702","https://openalex.org/W6748989285","https://openalex.org/W6763157893","https://openalex.org/W6765002771","https://openalex.org/W6791806579","https://openalex.org/W6796617203","https://openalex.org/W6798345263","https://openalex.org/W6798596300"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856"],"abstract_inverted_index":{"Robots":[0],"assist":[1],"humans":[2,131],"in":[3,122,140],"various":[4],"activities,":[5],"from":[6],"daily":[7],"living":[8],"to":[9,80,104],"collaborative":[10],"manufacturing.":[11],"Because":[12],"they":[13],"have":[14,25],"biased":[15,86],"learning":[16],"sources":[17],"(e.g.,":[18,31],"data,":[19],"demonstrations,":[20,135],"human":[21],"feedback),":[22],"robots":[23,82],"inevitably":[24],"discriminatory":[26,36],"performance":[27,37],"regarding":[28],"individual":[29],"differences":[30],"skin":[32],"color,":[33],"mobility,":[34],"appearance);":[35],"will":[38],"undermine":[39],"robots\u2019":[40],"service":[41,116,134],"quality,":[42],"causes":[43],"request":[44],"ignorance":[45],"and":[46,49,84,99,132],"response":[47],"delay,":[48],"even":[50],"cause":[51],"emotional":[52],"offenses.":[53],"Therefore,":[54],"mitigating":[55],"biases":[56],"is":[57],"critically":[58],"important":[59],"for":[60],"delivering":[61],"fair":[62,106],"robotic":[63],"services.":[64,145],"In":[65],"this":[66],"paper,":[67],"we":[68,112],"design":[69],"a":[70,114,118,123,126],"bias-mitigation":[71],"method":[72],"\u2013":[73],"Fairness-Sensitive":[74],"Policy":[75],"Gradient":[76],"Reinforcement":[77],"Learning":[78],"(FSPGRL),":[79],"help":[81],"self-identify":[83],"correct":[85],"behaviors.":[87],"FSP-GRL":[88],"identifies":[89],"bias":[90],"by":[91],"examining":[92],"the":[93,101],"abnormal":[94],"updates":[95,100],"along":[96],"particular":[97],"gradients":[98],"policy":[102],"network":[103],"provide":[105],"decisions.":[107],"To":[108],"validate":[109],"FSPGRL\u2019s":[110],"effectiveness,":[111],"designed":[113],"human-centered":[115],"scenario:":[117],"robot":[119,144],"serving":[120],"people":[121],"restaurant.":[124],"With":[125],"user":[127],"study":[128],"involving":[129],"24":[130],"1,000":[133],"FSPGRL":[136],"has":[137],"proven":[138],"effective":[139],"maintaining":[141],"fairness":[142],"during":[143]},"counts_by_year":[],"updated_date":"2025-12-22T23:10:17.713674","created_date":"2025-10-10T00:00:00"}
