{"id":"https://openalex.org/W4399364491","doi":"https://doi.org/10.1145/3630106.3658940","title":"Generalized People Diversity: Learning a Human Perception-Aligned Diversity Representation for People Images","display_name":"Generalized People Diversity: Learning a Human Perception-Aligned Diversity Representation for People Images","publication_year":2024,"publication_date":"2024-06-03","ids":{"openalex":"https://openalex.org/W4399364491","doi":"https://doi.org/10.1145/3630106.3658940"},"language":"en","primary_location":{"id":"doi:10.1145/3630106.3658940","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3630106.3658940","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3630106.3658940","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 2024 ACM Conference on Fairness Accountability and Transparency","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3630106.3658940","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066181313","display_name":"Hansa Srinivasan","orcid":"https://orcid.org/0009-0004-9252-7754"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Hansa Srinivasan","raw_affiliation_strings":["Google, United States of America"],"affiliations":[{"raw_affiliation_string":"Google, United States of America","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027056673","display_name":"Candice Schumann","orcid":"https://orcid.org/0000-0002-2313-1279"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Candice Schumann","raw_affiliation_strings":["Google, USA"],"affiliations":[{"raw_affiliation_string":"Google, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079501833","display_name":"Aradhana Sinha","orcid":"https://orcid.org/0009-0006-0092-8214"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aradhana Sinha","raw_affiliation_strings":["Google, USA"],"affiliations":[{"raw_affiliation_string":"Google, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052778643","display_name":"David Madras","orcid":"https://orcid.org/0000-0001-6817-8743"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Madras","raw_affiliation_strings":["Google, United States of America"],"affiliations":[{"raw_affiliation_string":"Google, United States of America","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001996369","display_name":"Gbolahan O. Olanubi","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gbolahan Oluwafemi Olanubi","raw_affiliation_strings":["Google, USA"],"affiliations":[{"raw_affiliation_string":"Google, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080988309","display_name":"Alex Beutel","orcid":"https://orcid.org/0000-0002-5917-2849"},"institutions":[{"id":"https://openalex.org/I4210161460","display_name":"OpenAI (United States)","ror":"https://ror.org/05wx9n238","country_code":"US","type":"company","lineage":["https://openalex.org/I4210161460"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alex Beutel","raw_affiliation_strings":["OpenAI, United States of America"],"affiliations":[{"raw_affiliation_string":"OpenAI, United States of America","institution_ids":["https://openalex.org/I4210161460"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088559113","display_name":"Susanna Ricco","orcid":"https://orcid.org/0009-0005-1505-7055"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Susanna Ricco","raw_affiliation_strings":["Google, USA"],"affiliations":[{"raw_affiliation_string":"Google, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033428202","display_name":"Jilin Chen","orcid":"https://orcid.org/0000-0002-3359-0938"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jilin Chen","raw_affiliation_strings":["Google, USA"],"affiliations":[{"raw_affiliation_string":"Google, USA","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5066181313"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":0.2632,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.49385915,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"797","last_page":"821"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8988000154495239,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8988000154495239,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.885200023651123,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.8321999907493591,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/diversity","display_name":"Diversity (politics)","score":0.755611777305603},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.7088303565979004},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.7045485973358154},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6408922672271729},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.6194557547569275},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6013324856758118},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6011168956756592},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.5199143290519714},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.5046979188919067},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.49583134055137634},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4797888398170471},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.43057286739349365},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4123101532459259},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3909764587879181},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.39039233326911926},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32076355814933777},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.24042698740959167},{"id":"https://openalex.org/keywords/sociology","display_name":"Sociology","score":0.1266181468963623},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.06683123111724854}],"concepts":[{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.755611777305603},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.7088303565979004},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.7045485973358154},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6408922672271729},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.6194557547569275},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6013324856758118},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6011168956756592},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.5199143290519714},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.5046979188919067},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.49583134055137634},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4797888398170471},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.43057286739349365},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4123101532459259},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3909764587879181},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.39039233326911926},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32076355814933777},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.24042698740959167},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.1266181468963623},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.06683123111724854},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3630106.3658940","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3630106.3658940","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3630106.3658940","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 2024 ACM Conference on Fairness Accountability and Transparency","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3630106.3658940","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3630106.3658940","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3630106.3658940","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 2024 ACM Conference on Fairness Accountability and Transparency","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7400000095367432,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4399364491.pdf"},"referenced_works_count":39,"referenced_works":["https://openalex.org/W1949009274","https://openalex.org/W1975517671","https://openalex.org/W2013456744","https://openalex.org/W2024082504","https://openalex.org/W2060658705","https://openalex.org/W2070134118","https://openalex.org/W2075778137","https://openalex.org/W2096912641","https://openalex.org/W2103612294","https://openalex.org/W2108598243","https://openalex.org/W2111336742","https://openalex.org/W2118509786","https://openalex.org/W2118573581","https://openalex.org/W2123432324","https://openalex.org/W2146649333","https://openalex.org/W2149252982","https://openalex.org/W2609731892","https://openalex.org/W2781551595","https://openalex.org/W2799258637","https://openalex.org/W2963775347","https://openalex.org/W2964247748","https://openalex.org/W3027050591","https://openalex.org/W3037594484","https://openalex.org/W3094231124","https://openalex.org/W3135367836","https://openalex.org/W3138773240","https://openalex.org/W3157831956","https://openalex.org/W3163396516","https://openalex.org/W3183266055","https://openalex.org/W3204130547","https://openalex.org/W3206428286","https://openalex.org/W4213264788","https://openalex.org/W4242177601","https://openalex.org/W4253763531","https://openalex.org/W4283168936","https://openalex.org/W4285395379","https://openalex.org/W4288083803","https://openalex.org/W4309618884","https://openalex.org/W4390872723"],"related_works":["https://openalex.org/W2329500892","https://openalex.org/W28991112","https://openalex.org/W2370726991","https://openalex.org/W2369710579","https://openalex.org/W4327728159","https://openalex.org/W2150136235","https://openalex.org/W2053591227","https://openalex.org/W2581240705","https://openalex.org/W2041353081","https://openalex.org/W2568183987"],"abstract_inverted_index":{"Capturing":[0],"the":[1,73,77,139,153],"diversity":[2,44,97,157],"of":[3,42,66,93,95,141],"people":[4,31,43],"in":[5,45,76,105],"images":[6],"is":[7,86,103,112,127],"challenging:":[8],"recent":[9],"literature":[10],"tends":[11],"to":[12,59,89,114,163],"focus":[13],"on":[14,129],"diversifying":[15],"one":[16],"or":[17,24,62],"two":[18,106],"attributes,":[19],"requiring":[20],"expensive":[21],"attribute":[22],"labels":[23],"building":[25],"classifiers.":[26],"We":[27],"introduce":[28],"a":[29,46,91,109,116,120],"diverse":[30],"image":[32],"ranking":[33,83],"method":[34,155],"which":[35],"more":[36],"flexibly":[37],"aligns":[38],"with":[39],"human":[40,133,167],"notions":[41],"less":[47],"prescriptive,":[48],"label-free":[49],"manner.":[50],"The":[51],"Perception-Aligned":[52],"Text-derived":[53],"Human":[54],"representation":[55,74,118,126],"Space":[56],"(PATHS)":[57],"aims":[58],"capture":[60],"all":[61],"many":[63],"relevant":[64],"features":[65],"people-related":[67,96,142],"diversity,":[68],"and,":[69],"when":[70],"used":[71,113],"as":[72],"space":[75],"standard":[78],"Maximal":[79],"Marginal":[80],"Relevance":[81],"(MMR)":[82],"algorithm":[84],"[7],":[85],"better":[87,158],"able":[88],"surface":[90],"range":[92],"types":[94],"(e.g.":[98],"disability,":[99],"cultural":[100],"attire).":[101],"PATHS":[102,154],"created":[104],"stages.":[107],"First,":[108],"text-guided":[110],"approach":[111],"extract":[115],"person-diversity":[117],"from":[119,132,166],"pre-trained":[121],"image-text":[122],"model.":[123],"Then":[124],"this":[125],"fine-tuned":[128],"perception":[130],"judgments":[131],"annotators":[134],"so":[135],"that":[136,144,152],"it":[137],"captures":[138],"aspects":[140],"similarity":[143],"humans":[145],"find":[146],"most":[147],"salient.":[148],"Empirical":[149],"results":[150],"show":[151],"achieves":[156],"than":[159],"baseline":[160],"methods,":[161],"according":[162],"side-by-side":[164],"ratings":[165],"annotators.":[168]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
