{"id":"https://openalex.org/W4416799450","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249300","title":"Reducing Implicit Class Imbalance in Unlabeled Datasets Using Text-Specified Sensitive Attributes","display_name":"Reducing Implicit Class Imbalance in Unlabeled Datasets Using Text-Specified Sensitive Attributes","publication_year":2025,"publication_date":"2025-10-22","ids":{"openalex":"https://openalex.org/W4416799450","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249300"},"language":null,"primary_location":{"id":"doi:10.1109/apsipaasc65261.2025.11249300","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249300","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120570675","display_name":"Kosei Suayama","orcid":null},"institutions":[{"id":"https://openalex.org/I161296585","display_name":"Tokyo University of Science","ror":"https://ror.org/05sj3n476","country_code":"JP","type":"education","lineage":["https://openalex.org/I161296585"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kosei Suayama","raw_affiliation_strings":["Tokyo University of Science,Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tokyo University of Science,Japan","institution_ids":["https://openalex.org/I161296585"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058191809","display_name":"Kazuaki Nakamura","orcid":"https://orcid.org/0000-0002-4859-4624"},"institutions":[{"id":"https://openalex.org/I161296585","display_name":"Tokyo University of Science","ror":"https://ror.org/05sj3n476","country_code":"JP","type":"education","lineage":["https://openalex.org/I161296585"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kazuaki Nakamura","raw_affiliation_strings":["Tokyo University of Science,Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tokyo University of Science,Japan","institution_ids":["https://openalex.org/I161296585"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.17652011,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2032","last_page":"2037"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.4016999900341034,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.4016999900341034,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.251800000667572,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.09939999878406525,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.7361999750137329},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.6568999886512756},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6326000094413757},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5591999888420105},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.508899986743927},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.4309999942779541}],"concepts":[{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.7361999750137329},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7131999731063843},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.6568999886512756},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6326000094413757},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.630299985408783},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5591999888420105},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.508899986743927},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.43230000138282776},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.4309999942779541},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.365200012922287},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.36329999566078186},{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.34040001034736633},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.2849999964237213},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2824999988079071},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.25679999589920044},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.251800000667572}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipaasc65261.2025.11249300","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249300","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W2081580037","https://openalex.org/W2104933073","https://openalex.org/W2592232824","https://openalex.org/W2963351448","https://openalex.org/W2963613787","https://openalex.org/W2963691377","https://openalex.org/W2971581288","https://openalex.org/W3009883635","https://openalex.org/W3087783715","https://openalex.org/W3092661284","https://openalex.org/W4405989400"],"related_works":[],"abstract_inverted_index":{"Modern":[0],"AI":[1],"models":[2],"sometimes":[3],"output":[4],"biased":[5,26],"results":[6,190],"on":[7,68,99,195],"sensitive":[8],"attributes":[9],"(SA)":[10],"such":[11],"as":[12,100,171],"\u201crace\u201d":[13,200],"and":[14,174,201],"\u201cage\u201d,":[15,202],"which":[16,94],"can":[17],"cause":[18],"a":[19,29,43,87,107,139,144,163,186,218],"social":[20],"issue.":[21],"A":[22],"reason":[23],"for":[24,79,109],"these":[25],"outputs":[27],"is":[28,46,208],"class":[30,40,50,62,73,113,215],"imbalance":[31,41,51,74,114,216],"problem":[32,70],"in":[33,56,75,115,138,217],"the":[34,39,49,69,111,157,168,176,205,213],"training":[35],"dataset.":[36,159,188,222],"Therefore,":[37],"reducing":[38,110,212],"of":[42,71,179,191,198,210],"given":[44,219],"dataset":[45,142],"important.":[47],"Although":[48],"could":[52],"be":[53,97],"implicitly":[54],"contained":[55],"unlabeled":[57,76,116,220],"datasets":[58,117],"that":[59,118,204],"have":[60],"no":[61,64],"labels,":[63,173],"existing":[65],"studies":[66],"focus":[67],"implicit":[72,112,214],"datasets,":[77],"except":[78],"our":[80,84,192],"previous":[81],"work.":[82],"Even":[83],"method":[85,108,128,207],"has":[86],"serious":[88],"drawback:":[89],"it":[90],"cannot":[91],"explicitly":[92],"specify":[93,122],"attribute":[95],"should":[96],"focused":[98],"SA.":[101],"In":[102],"this":[103],"paper,":[104],"we":[105,161],"propose":[106],"allows":[119],"us":[120],"to":[121,155,184],"SA":[123],"by":[124],"text.":[125],"The":[126,149,189],"proposed":[127,206],"first":[129],"extracts":[130],"an":[131],"SA-related":[132],"visual":[133],"feature":[134],"from":[135,181],"each":[136,182],"image":[137],"target":[140,158],"imbalanced":[141],"using":[143],"vision-language":[145],"model":[146],"called":[147],"CLIP.":[148],"extracted":[150],"features":[151],"are":[152],"next":[153],"utilized":[154],"cluster":[156,169],"Then,":[160],"train":[162],"conditional":[164],"diffusion":[165],"model,":[166],"regarding":[167],"IDs":[170],"pseudoclass":[172],"generate":[175],"same":[177],"number":[178],"images":[180],"pseudo-class":[183],"construct":[185],"balanced":[187],"experiments":[193],"focusing":[194],"two":[196],"types":[197],"SA,":[199],"demonstrated":[203],"capable":[209],"effectively":[211],"face":[221]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-11-28T00:00:00"}
