{"id":"https://openalex.org/W7139966286","doi":"https://doi.org/10.1016/j.procs.2026.01.018","title":"AI\u2013Driven Equity Evaluation Frameworks with Contrastive Models for Responsible Benchmarking in Natural Language Processing","display_name":"AI\u2013Driven Equity Evaluation Frameworks with Contrastive Models for Responsible Benchmarking in Natural Language Processing","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7139966286","doi":"https://doi.org/10.1016/j.procs.2026.01.018"},"language":"en","primary_location":{"id":"doi:10.1016/j.procs.2026.01.018","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.018","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1016/j.procs.2026.01.018","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121733784","display_name":"Roohee Khan","orcid":null},"institutions":[{"id":"https://openalex.org/I2800614057","display_name":"Kalinga University","ror":"https://ror.org/03afg5j45","country_code":"IN","type":"education","lineage":["https://openalex.org/I2800614057"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Roohee Khan","raw_affiliation_strings":["Kalinga University, Naya Raipur, Chhattisgarh, India"],"affiliations":[{"raw_affiliation_string":"Kalinga University, Naya Raipur, Chhattisgarh, India","institution_ids":["https://openalex.org/I2800614057"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5123712200","display_name":"Ashu Nayak","orcid":null},"institutions":[{"id":"https://openalex.org/I2800614057","display_name":"Kalinga University","ror":"https://ror.org/03afg5j45","country_code":"IN","type":"education","lineage":["https://openalex.org/I2800614057"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Ashu Nayak","raw_affiliation_strings":["Kalinga University, Naya Raipur, Chhattisgarh, India"],"affiliations":[{"raw_affiliation_string":"Kalinga University, Naya Raipur, Chhattisgarh, India","institution_ids":["https://openalex.org/I2800614057"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5121733784"],"corresponding_institution_ids":["https://openalex.org/I2800614057"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.93715708,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":"275","issue":null,"first_page":"140","last_page":"147"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.28619998693466187,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.28619998693466187,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.2802000045776367,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.07109999656677246,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.8355000019073486},{"id":"https://openalex.org/keywords/equity","display_name":"Equity (law)","score":0.6352999806404114},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.4059000015258789},{"id":"https://openalex.org/keywords/natural-language-understanding","display_name":"Natural language understanding","score":0.3822000026702881},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.29820001125335693}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8866999745368958},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.8355000019073486},{"id":"https://openalex.org/C199728807","wikidata":"https://www.wikidata.org/wiki/Q2578557","display_name":"Equity (law)","level":2,"score":0.6352999806404114},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4374000132083893},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4366999864578247},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.41269999742507935},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.4059000015258789},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.3822000026702881},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.35740000009536743},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.3208000063896179},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.29820001125335693},{"id":"https://openalex.org/C3018395757","wikidata":"https://www.wikidata.org/wiki/Q1379672","display_name":"Evaluation methods","level":2,"score":0.2768000066280365},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.2759000062942505},{"id":"https://openalex.org/C2777629044","wikidata":"https://www.wikidata.org/wiki/Q614959","display_name":"Contrastive analysis","level":2,"score":0.26840001344680786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.procs.2026.01.018","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.018","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.procs.2026.01.018","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.018","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5317912101745605}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W4378189609","https://openalex.org/W4385067602","https://openalex.org/W4387059617","https://openalex.org/W4387221236","https://openalex.org/W4390231631","https://openalex.org/W4390506533","https://openalex.org/W4390686696","https://openalex.org/W4390974852","https://openalex.org/W4390974969","https://openalex.org/W4391494845","https://openalex.org/W4391545757","https://openalex.org/W4392234077","https://openalex.org/W4392902463","https://openalex.org/W4393618909","https://openalex.org/W4394850884","https://openalex.org/W4398198142","https://openalex.org/W4400205824","https://openalex.org/W4401453382","https://openalex.org/W4402274395","https://openalex.org/W4403446022","https://openalex.org/W4404284060","https://openalex.org/W4404300986","https://openalex.org/W4405271521","https://openalex.org/W4406039161","https://openalex.org/W4410382551","https://openalex.org/W4410428252","https://openalex.org/W4410616178","https://openalex.org/W4410639293","https://openalex.org/W4410949762","https://openalex.org/W4416288646"],"related_works":[],"abstract_inverted_index":{"The":[0,42,141,167],"importance":[1],"of":[2,21,81,117,120,137,149,204,241],"equity":[3,212],"considerations":[4],"in":[5,36,92,114,129,178,180,213,229],"Natural":[6],"Language":[7],"Processing":[8],"(NLP)":[9],"has":[10],"grown":[11],"as":[12,52,73,161,187],"AI":[13],"systems":[14],"have":[15],"increasingly":[16],"affected":[17],"diverse":[18],"populations.":[19],"Assessment":[20],"benchmarking":[22],"for":[23,232,248,253],"responsible":[24,264],"deployment":[25],"incorporates":[26],"protocols":[27],"that":[28,173],"can":[29,196],"determine":[30],"with":[31,122,182],"certainty":[32],"and":[33,147,201,216,221,226,260,265],"minimize":[34],"biases":[35,228],"groups":[37],"defined":[38],"by":[39],"demographic":[40,188],"characteristics.":[41],"existing":[43],"evaluation":[44,82,203],"processes":[45],"are":[46,95],"skewed":[47],"towards":[48],"measuring":[49],"model":[50,94,154,205,230,258],"performance":[51,59],"a":[53,93,103,118,138,162,170,198],"single":[54],"score":[55,172],"or":[56,66,76,87,190],"an":[57],"aggregate":[58],"measure,":[60],"which":[61],"cannot":[62],"reveal":[63],"fine-grained":[64],"inequities":[65,86,242,259],"differences":[67,177],"based":[68,109],"on":[69,110],"sensitive":[70,131],"attributes,":[71],"such":[72,186],"gender,":[74],"race,":[75],"age":[77],"levels.":[78],"These":[79],"types":[80],"do":[83],"not":[84],"reflect":[85],"unfairness":[88],"when":[89],"specific":[90],"results":[91],"biased":[96],"downstream.":[97],"To":[98],"fill":[99],"this":[100],"gap,":[101],"introduce":[102],"Contrastive":[104],"Fairness":[105],"Evaluation":[106],"(CFE)":[107],"system":[108],"using":[111],"contrastive":[112,176],"inputs":[113],"the":[115,124,130,135,145,150,158,175,194,236,257],"form":[116],"pair":[119],"sentences":[121],"all":[123],"exact":[125],"words,":[126],"but":[127],"differing":[128],"attribute,":[132],"to":[133,164,210,251,255],"evaluate":[134],"fairness":[136,184],"given":[139],"model.":[140],"CFE":[142,168,207],"approach":[143,237],"uses":[144],"similarity":[146],"divergence":[148],"two":[151],"input":[152],"pairs\u2019":[153],"predictions,":[155],"measured":[156],"at":[157],"outcome":[159],"level,":[160],"unit":[163],"assess":[165,211],"inequalities.":[166],"provides":[169],"numeric":[171],"captures":[174],"outcomes,":[179],"line":[181],"established":[183],"assessments,":[185],"parity":[189],"equal":[191],"odds.":[192],"Furthermore,":[193],"framework":[195],"provide":[197],"more":[199,263],"interpretable":[200],"reliable":[202],"equity.":[206],"is":[208],"demonstrated":[209],"machine":[214],"translation":[215],"sentiment":[217],"analysis":[218],"(regarding":[219],"gender":[220,225],"race),":[222],"exposing":[223],"subtle":[224],"racial":[227],"outputs":[231],"both":[233],"tasks.":[234],"Moreover,":[235],"enables":[238],"effective":[239],"identification":[240],"while":[243],"simultaneously":[244],"providing":[245],"actionable":[246],"feedback":[247],"additional":[249],"training":[250],"plan":[252],"strategies":[254],"address":[256],"make":[261],"deployments":[262],"equitable.":[266]},"counts_by_year":[],"updated_date":"2026-03-22T06:25:25.174409","created_date":"2026-03-21T00:00:00"}
