{"id":"https://openalex.org/W7124596654","doi":"https://doi.org/10.1016/j.patcog.2026.113091","title":"DemoFace: A Demographic Pixelated Face Biometric Image-Text Embedding Dataset with Fairness Baselines","display_name":"DemoFace: A Demographic Pixelated Face Biometric Image-Text Embedding Dataset with Fairness Baselines","publication_year":2026,"publication_date":"2026-01-17","ids":{"openalex":"https://openalex.org/W7124596654","doi":"https://doi.org/10.1016/j.patcog.2026.113091"},"language":"en","primary_location":{"id":"doi:10.1016/j.patcog.2026.113091","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.patcog.2026.113091","pdf_url":null,"source":{"id":"https://openalex.org/S414566","display_name":"Pattern Recognition","issn_l":"0031-3203","issn":["0031-3203","1873-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Pattern Recognition","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1016/j.patcog.2026.113091","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123288398","display_name":"Abu Sufian","orcid":null},"institutions":[{"id":"https://openalex.org/I4210146308","display_name":"Institute of Intelligent Systems for Automation","ror":"https://ror.org/051t1q308","country_code":"IT","type":"facility","lineage":["https://openalex.org/I4210146308","https://openalex.org/I4210155236"]},{"id":"https://openalex.org/I4210155236","display_name":"National Research Council","ror":"https://ror.org/04zaypm56","country_code":"IT","type":"nonprofit","lineage":["https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Abu Sufian","raw_affiliation_strings":["National Research Council of Italy - Institute of Applied Sciences and Intelligent Systems (CNR-ISASI), 73100 Lecce, LE, Italy"],"affiliations":[{"raw_affiliation_string":"National Research Council of Italy - Institute of Applied Sciences and Intelligent Systems (CNR-ISASI), 73100 Lecce, LE, Italy","institution_ids":["https://openalex.org/I4210155236","https://openalex.org/I4210146308"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002267907","display_name":"Anirudha Ghosh","orcid":"https://orcid.org/0009-0004-1465-0386"},"institutions":[{"id":"https://openalex.org/I130291710","display_name":"Visva-Bharati University","ror":"https://ror.org/02y28sc20","country_code":"IN","type":"education","lineage":["https://openalex.org/I130291710"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Anirudha Ghosh","raw_affiliation_strings":["Department of Computer and System Sciences, Visva-Bharati, Santiniketan, 731235, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer and System Sciences, Visva-Bharati, Santiniketan, 731235, India","institution_ids":["https://openalex.org/I130291710"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002635411","display_name":"Debaditya Barman","orcid":"https://orcid.org/0000-0002-7562-119X"},"institutions":[{"id":"https://openalex.org/I130291710","display_name":"Visva-Bharati University","ror":"https://ror.org/02y28sc20","country_code":"IN","type":"education","lineage":["https://openalex.org/I130291710"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Debaditya Barman","raw_affiliation_strings":["Department of Computer and System Sciences, Visva-Bharati, Santiniketan, 731235, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer and System Sciences, Visva-Bharati, Santiniketan, 731235, India","institution_ids":["https://openalex.org/I130291710"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Cosimo Distante","orcid":"https://orcid.org/0000-0002-1073-2390"},"institutions":[{"id":"https://openalex.org/I4210146308","display_name":"Institute of Intelligent Systems for Automation","ror":"https://ror.org/051t1q308","country_code":"IT","type":"facility","lineage":["https://openalex.org/I4210146308","https://openalex.org/I4210155236"]},{"id":"https://openalex.org/I4210155236","display_name":"National Research Council","ror":"https://ror.org/04zaypm56","country_code":"IT","type":"nonprofit","lineage":["https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Cosimo Distante","raw_affiliation_strings":["National Research Council of Italy - Institute of Applied Sciences and Intelligent Systems (CNR-ISASI), 73100 Lecce, LE, Italy"],"affiliations":[{"raw_affiliation_string":"National Research Council of Italy - Institute of Applied Sciences and Intelligent Systems (CNR-ISASI), 73100 Lecce, LE, Italy","institution_ids":["https://openalex.org/I4210155236","https://openalex.org/I4210146308"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121766689","display_name":"Marco Leo","orcid":null},"institutions":[{"id":"https://openalex.org/I4210146308","display_name":"Institute of Intelligent Systems for Automation","ror":"https://ror.org/051t1q308","country_code":"IT","type":"facility","lineage":["https://openalex.org/I4210146308","https://openalex.org/I4210155236"]},{"id":"https://openalex.org/I4210155236","display_name":"National Research Council","ror":"https://ror.org/04zaypm56","country_code":"IT","type":"nonprofit","lineage":["https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marco Leo","raw_affiliation_strings":["National Research Council of Italy - Institute of Applied Sciences and Intelligent Systems (CNR-ISASI), 73100 Lecce, LE, Italy"],"affiliations":[{"raw_affiliation_string":"National Research Council of Italy - Institute of Applied Sciences and Intelligent Systems (CNR-ISASI), 73100 Lecce, LE, Italy","institution_ids":["https://openalex.org/I4210155236","https://openalex.org/I4210146308"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028459279","display_name":"Farhana Sultana","orcid":"https://orcid.org/0000-0001-8334-6784"},"institutions":[{"id":"https://openalex.org/I33932797","display_name":"University of Gour Banga","ror":"https://ror.org/00pyh2y32","country_code":"IN","type":"education","lineage":["https://openalex.org/I33932797"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Farhana Sultana","raw_affiliation_strings":["Department of Computer Science, University of Gour Banga, English Bazar, 732103, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Gour Banga, English Bazar, 732103, India","institution_ids":["https://openalex.org/I33932797"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5123288398"],"corresponding_institution_ids":["https://openalex.org/I4210146308","https://openalex.org/I4210155236"],"apc_list":{"value":2710,"currency":"USD","value_usd":2710},"apc_paid":{"value":2710,"currency":"USD","value_usd":2710},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14388814,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"175","issue":null,"first_page":"113091","last_page":"113091"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9865000247955322,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9865000247955322,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10828","display_name":"Biometric Identification and Security","score":0.0032999999821186066,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.0017999999690800905,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/biometrics","display_name":"Biometrics","score":0.8269000053405762},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.6284000277519226},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5975000262260437},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5414000153541565},{"id":"https://openalex.org/keywords/facial-recognition-system","display_name":"Facial recognition system","score":0.4706000089645386},{"id":"https://openalex.org/keywords/scarcity","display_name":"Scarcity","score":0.42170000076293945},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.39890000224113464},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.33000001311302185}],"concepts":[{"id":"https://openalex.org/C184297639","wikidata":"https://www.wikidata.org/wiki/Q177765","display_name":"Biometrics","level":2,"score":0.8269000053405762},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7759000062942505},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.6284000277519226},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5975000262260437},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5846999883651733},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5414000153541565},{"id":"https://openalex.org/C31510193","wikidata":"https://www.wikidata.org/wiki/Q1192553","display_name":"Facial recognition system","level":3,"score":0.4706000089645386},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4620000123977661},{"id":"https://openalex.org/C109747225","wikidata":"https://www.wikidata.org/wiki/Q815758","display_name":"Scarcity","level":2,"score":0.42170000076293945},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.39890000224113464},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33000001311302185},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3231000006198883},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.31779998540878296},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3138999938964844},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.3018999993801117},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.2897000014781952},{"id":"https://openalex.org/C2776207758","wikidata":"https://www.wikidata.org/wiki/Q5303302","display_name":"Downstream (manufacturing)","level":2,"score":0.2842000126838684},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.28299999237060547},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2565999925136566}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.patcog.2026.113091","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.patcog.2026.113091","pdf_url":null,"source":{"id":"https://openalex.org/S414566","display_name":"Pattern Recognition","issn_l":"0031-3203","issn":["0031-3203","1873-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Pattern Recognition","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.patcog.2026.113091","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.patcog.2026.113091","pdf_url":null,"source":{"id":"https://openalex.org/S414566","display_name":"Pattern Recognition","issn_l":"0031-3203","issn":["0031-3203","1873-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Pattern Recognition","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/5","display_name":"Gender equality","score":0.7534297704696655}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2919115771","https://openalex.org/W3048511172","https://openalex.org/W3095695030","https://openalex.org/W3182380222","https://openalex.org/W3192864012","https://openalex.org/W3199041638","https://openalex.org/W4312193916","https://openalex.org/W4386472899","https://openalex.org/W4387377782","https://openalex.org/W4389671650","https://openalex.org/W4392122172","https://openalex.org/W4392672760","https://openalex.org/W4400859766","https://openalex.org/W4406208390","https://openalex.org/W4408865267"],"related_works":[],"abstract_inverted_index":{"\u2022":[0,18,37,69],"DemoFace":[1],"provides":[2],"a":[3,50,205],"demographically":[4],"balanced":[5,206],"pixelated":[6,212,263],"real":[7,213],"face":[8,15,66,160,195,208,214,279,290],"image":[9],"dataset":[10,47,209],"to":[11,57,91],"mitigate":[12],"biases":[13,34],"in":[14,35,65,84,101,110,166,189],"biometric":[16,67,117,196],"systems.":[17],"The":[19,245],"dataset\u2019s":[20],"structured":[21],"image\u2013text":[22],"embedding":[23,269],"multimodality":[24,270],"supports":[25],"downstream":[26,194],"tasks":[27,123,281],"and":[28,48,61,76,96,230,253,260,282,294,307,319],"facilitates":[29],"the":[30,46,59,154,170,187,327,336],"analysis":[31],"of":[32,52,63,124,156,172,216,275],"model":[33,182],"CVFMs.":[36],"Through":[38,70,286],"our":[39,71],"novel":[40],"Responsible":[41],"AI":[42,332],"methodology,":[43],"we":[44,79,202,300],"developed":[45],"established":[49,301],"set":[51,238],"baselines":[53,311],"using":[54,73,235],"SOTA":[55,86],"CVFMs":[56,64,192,276],"assess":[58],"performance":[60],"fairness":[62,97,188],"tasks.":[68,197],"evaluation":[72],"both":[74,317],"new":[75,318],"adapted":[77],"metrics,":[78],"revealed":[80],"inherent":[81,313],"bias":[82,283,314],"patterns":[83,315],"several":[85],"CVFMs,":[87],"providing":[88],"valuable":[89],"insights":[90],"guide":[92],"future":[93],"research.":[94],"Bias":[95],"are":[98,121,127,151],"critical":[99],"challenges":[100],"data-driven":[102],"computer":[103],"vision":[104],"(CV),":[105],"where":[106],"limited":[107],"demographic":[108,139,174,207,224],"diversity":[109],"training":[111],"data":[112],"worsens":[113],"these":[114,131,200],"challenges.":[115],"Face":[116],"(face":[118],"recognition)":[119],"systems":[120],"core":[122],"CV":[125,147,157],"that":[126],"highly":[128],"impacted":[129],"by":[130,227,255],"challenges,":[132],"as":[133,178,292,297],"existing":[134,324],"real-face":[135],"datasets":[136,144],"lack":[137],"comprehensive":[138],"representation,":[140],"whereas":[141],"current":[142],"synthetic":[143],"promote":[145],"stereotypes.":[146],"Foundation":[148],"Models":[149],"(CVFMs)":[150],"currently":[152],"at":[153],"forefront":[155],"applications,":[158],"including":[159],"biometrics,":[161],"which":[162],"use":[163],"global":[164],"features":[165],"multimodal":[167,175],"data.":[168],"However,":[169],"scarcity":[171],"large-scale,":[173],"datasets,":[176],"such":[177],"image-text":[179,268],"embeddings":[180],"for":[181,193,264,277,329],"fine-tuning":[183,272],"(or":[184,273],"training),":[185],"limits":[186],"state-of-the-art":[190],"(SOTA)":[191],"To":[198],"address":[199],"issues,":[201],"introduce":[203],"DemoFace,":[204],"comprising":[210],"30,240":[211],"images":[215,234,247],"672":[217],"representative":[218],"individuals":[219],"evenly":[220],"distributed":[221],"across":[222,304],"48":[223],"groups,":[225,259],"categorized":[226],"ethnicity/race,":[228,305],"gender,":[229,306],"age.":[231],"We":[232],"gathered":[233],"an":[236],"API":[237],"up":[239],"from":[240,323],"multiple":[241],"copyright-free":[242],"public":[243],"forums.":[244],"collected":[246],"were":[248],"then":[249,261],"manually":[250],"filtered,":[251],"anonymized,":[252],"annotated":[254],"two":[256,287],"independent":[257],"research":[258],"lightly":[262],"privacy":[265],"preservation.":[266],"DemoFace\u2019s":[267],"enables":[271],"training)":[274],"fairness-focused":[278],"biometrics":[280],"pattern":[284],"evaluation.":[285],"empirical":[288],"studies:":[289],"authentication":[291],"classification":[293],"textual":[295],"description":[296],"token":[298],"generation,":[299],"baseline":[302],"scores":[303],"age":[308],"groups.":[309],"Our":[310],"identified":[312],"through":[316],"tailored":[320],"metrics":[321],"derived":[322],"ones,":[325],"emphasizing":[326],"need":[328],"more":[330],"equitable":[331],"models.":[333],"Here":[334],"is":[335],"Repository:":[337],"Link":[338]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2026-01-19T00:00:00"}
