{"id":"https://openalex.org/W4416036342","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.818","title":"PakBBQ: A Culturally Adapted Bias Benchmark for QA","display_name":"PakBBQ: A Culturally Adapted Bias Benchmark for QA","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4416036342","doi":"https://doi.org/10.18653/v1/2025.emnlp-main.818"},"language":null,"primary_location":{"id":"doi:10.18653/v1/2025.emnlp-main.818","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.818","pdf_url":"https://aclanthology.org/2025.emnlp-main.818.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.emnlp-main.818.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120309061","display_name":"Abdullah Hashmat","orcid":null},"institutions":[{"id":"https://openalex.org/I207789805","display_name":"Lahore University of Management Sciences","ror":"https://ror.org/05b5x4a35","country_code":"PK","type":"education","lineage":["https://openalex.org/I207789805"]}],"countries":["PK"],"is_corresponding":true,"raw_author_name":"Abdullah Hashmat","raw_affiliation_strings":["Lahore University of Management Sciences Lahore , Pakistan"],"affiliations":[{"raw_affiliation_string":"Lahore University of Management Sciences Lahore , Pakistan","institution_ids":["https://openalex.org/I207789805"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113181018","display_name":"M. Jehanzeb Mirza","orcid":null},"institutions":[{"id":"https://openalex.org/I207789805","display_name":"Lahore University of Management Sciences","ror":"https://ror.org/05b5x4a35","country_code":"PK","type":"education","lineage":["https://openalex.org/I207789805"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Muhammad Arham Mirza","raw_affiliation_strings":["Lahore University of Management Sciences Lahore , Pakistan"],"affiliations":[{"raw_affiliation_string":"Lahore University of Management Sciences Lahore , Pakistan","institution_ids":["https://openalex.org/I207789805"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038004767","display_name":"Agha Ali Raza","orcid":"https://orcid.org/0000-0003-0124-9783"},"institutions":[{"id":"https://openalex.org/I207789805","display_name":"Lahore University of Management Sciences","ror":"https://ror.org/05b5x4a35","country_code":"PK","type":"education","lineage":["https://openalex.org/I207789805"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Agha Ali Raza","raw_affiliation_strings":["Lahore University of Management Sciences Lahore , Pakistan"],"affiliations":[{"raw_affiliation_string":"Lahore University of Management Sciences Lahore , Pakistan","institution_ids":["https://openalex.org/I207789805"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5120309061"],"corresponding_institution_ids":["https://openalex.org/I207789805"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.1842985,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"16171","last_page":"16183"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.0625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.0625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.03590000048279762,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10826","display_name":"Behavioral and Psychological Studies","score":0.01850000023841858,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/formality","display_name":"Formality","score":0.675000011920929},{"id":"https://openalex.org/keywords/framing","display_name":"Framing (construction)","score":0.5863999724388123},{"id":"https://openalex.org/keywords/cultural-bias","display_name":"Cultural bias","score":0.5109999775886536},{"id":"https://openalex.org/keywords/framing-effect","display_name":"Framing effect","score":0.4902999997138977},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.46309998631477356},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.35569998621940613},{"id":"https://openalex.org/keywords/confirmation-bias","display_name":"Confirmation bias","score":0.35010001063346863},{"id":"https://openalex.org/keywords/sampling-bias","display_name":"Sampling bias","score":0.32989999651908875}],"concepts":[{"id":"https://openalex.org/C2777159308","wikidata":"https://www.wikidata.org/wiki/Q1757948","display_name":"Formality","level":2,"score":0.675000011920929},{"id":"https://openalex.org/C169087156","wikidata":"https://www.wikidata.org/wiki/Q2131593","display_name":"Framing (construction)","level":2,"score":0.5863999724388123},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5285999774932861},{"id":"https://openalex.org/C37773902","wikidata":"https://www.wikidata.org/wiki/Q970594","display_name":"Cultural bias","level":2,"score":0.5109999775886536},{"id":"https://openalex.org/C136714292","wikidata":"https://www.wikidata.org/wiki/Q1440683","display_name":"Framing effect","level":3,"score":0.4902999997138977},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.46309998631477356},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38670000433921814},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37709999084472656},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.373199999332428},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.37209999561309814},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.35569998621940613},{"id":"https://openalex.org/C79585631","wikidata":"https://www.wikidata.org/wiki/Q431498","display_name":"Confirmation bias","level":2,"score":0.35010001063346863},{"id":"https://openalex.org/C75917345","wikidata":"https://www.wikidata.org/wiki/Q2725298","display_name":"Sampling bias","level":3,"score":0.32989999651908875},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.3271999955177307},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.3246000111103058},{"id":"https://openalex.org/C125209646","wikidata":"https://www.wikidata.org/wiki/Q1338878","display_name":"Cultural diversity","level":2,"score":0.287200003862381},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.28349998593330383},{"id":"https://openalex.org/C134801348","wikidata":"https://www.wikidata.org/wiki/Q7140425","display_name":"Non-response bias","level":2,"score":0.27730000019073486},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.2694999873638153},{"id":"https://openalex.org/C2983427547","wikidata":"https://www.wikidata.org/wiki/Q93200","display_name":"Gender bias","level":2,"score":0.26600000262260437},{"id":"https://openalex.org/C158600405","wikidata":"https://www.wikidata.org/wiki/Q5054566","display_name":"Causal inference","level":2,"score":0.2648000121116638},{"id":"https://openalex.org/C7220189","wikidata":"https://www.wikidata.org/wiki/Q52827","display_name":"Pictogram","level":2,"score":0.26350000500679016},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.2619999945163727},{"id":"https://openalex.org/C159447121","wikidata":"https://www.wikidata.org/wiki/Q490535","display_name":"Response bias","level":2,"score":0.25920000672340393},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25189998745918274}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.emnlp-main.818","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.818","pdf_url":"https://aclanthology.org/2025.emnlp-main.818.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.emnlp-main.818","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.emnlp-main.818","pdf_url":"https://aclanthology.org/2025.emnlp-main.818.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Conference on Empirical Methods in Natural Language Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4416036342.pdf","grobid_xml":"https://content.openalex.org/works/W4416036342.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,56,160],"widespread":[2],"adoption":[3],"of":[4,55,129,162],"Large":[5],"Language":[6],"Models":[7],"(LLMs)":[8],"across":[9,19,72],"various":[10],"applications,":[11],"it":[12],"is":[13],"imperative":[14],"to":[15,37],"ensure":[16],"their":[17],"fairness":[18],"all":[20],"user":[21],"communities.However,":[22],"most":[23],"LLMs":[24,105],"are":[25,98,155],"trained":[26],"and":[27,40,51,78,94,109,144,165],"evaluated":[28],"on":[29],"Western":[30],"centric":[31],"data,":[32],"with":[33,131],"little":[34],"attention":[35],"paid":[36],"lowresource":[38],"languages":[39],"regional":[41,92],"contexts.To":[42],"address":[43],"this":[44],"gap,":[45],"we":[46],"introduce":[47],"PakBBQ,":[48],"a":[49],"culturally":[50],"regionally":[52],"adapted":[53],"extension":[54],"original":[57],"Bias":[58],"Benchmark":[59],"for":[60,170],"Question":[61],"Answering":[62],"(BBQ)":[63],"dataset.PakBBQ":[64],"comprises":[65],"over":[66],"214":[67],"templates,":[68],"17180":[69],"QA":[70],"pairs":[71],"8":[73],"categories":[74],"in":[75,100,139,142,173],"both":[76,107],"English":[77],"Urdu,":[79],"covering":[80],"eight":[81],"bias":[82,137,171],"dimensions":[83],"including":[84],"age,":[85],"disability,":[86],"appearance,":[87],"gender,":[88],"socio-economic":[89],"status,":[90],"religious,":[91],"affiliation,":[93],"language":[95],"formality":[96],"that":[97,149],"relevant":[99],"Pakistan.We":[101],"evaluate":[102],"multiple":[103],"multilingual":[104],"under":[106],"ambiguous":[108],"explicitly":[110],"disambiguated":[111],"contexts,":[112],"as":[113,115],"well":[114],"negative":[116,119],"versus":[117],"non":[118],"question":[120],"framings.Our":[121],"experiments":[122],"reveal":[123],"(i)":[124],"an":[125],"average":[126],"accuracy":[127],"gain":[128],"12%":[130],"disambiguation,":[132],"(ii)":[133],"consistently":[134],"stronger":[135],"counter":[136],"behaviors":[138],"Urdu":[140],"than":[141],"English,":[143],"(iii)":[145],"marked":[146],"framing":[147],"effects":[148],"reduce":[150],"stereotypical":[151],"responses":[152],"when":[153],"questions":[154],"posed":[156],"negatively.These":[157],"findings":[158],"highlight":[159],"importance":[161],"contextualized":[163],"benchmarks":[164],"simple":[166],"prompt":[167],"engineering":[168],"strategies":[169],"mitigation":[172],"low":[174],"resource":[175],"settings.":[176]},"counts_by_year":[],"updated_date":"2026-03-11T06:11:40.159057","created_date":"2025-11-08T00:00:00"}
