{"id":"https://openalex.org/W4403791856","doi":"https://doi.org/10.1145/3664647.3681171","title":"Category-Prompt Refined Feature Learning for Long-Tailed Multi-Label Image Classification","display_name":"Category-Prompt Refined Feature Learning for Long-Tailed Multi-Label Image Classification","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403791856","doi":"https://doi.org/10.1145/3664647.3681171"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3681171","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3681171","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103534250","display_name":"Jiexuan Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiexuan Yan","raw_affiliation_strings":["School of Big Data &amp; Software Engineering, Chongqing University, Chongqing, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"School of Big Data &amp; Software Engineering, Chongqing University, Chongqing, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052560070","display_name":"Sheng Huang","orcid":"https://orcid.org/0000-0001-5610-0826"},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sheng Huang","raw_affiliation_strings":["School of Big Data &amp; Software Engineering, Chongqing University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"School of Big Data &amp; Software Engineering, Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114416565","display_name":"NanKun Mu","orcid":"https://orcid.org/0000-0001-9713-4416"},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"NanKun Mu","raw_affiliation_strings":["College of Computer Science, Chongqing University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science, Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037518351","display_name":"Luwen Huangfu","orcid":null},"institutions":[{"id":"https://openalex.org/I26538001","display_name":"San Diego State University","ror":"https://ror.org/0264fdx42","country_code":"US","type":"education","lineage":["https://openalex.org/I26538001"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Luwen Huangfu","raw_affiliation_strings":["Fowler College of Business, San Diego State University, San Diego, CA, USA"],"affiliations":[{"raw_affiliation_string":"Fowler College of Business, San Diego State University, San Diego, CA, USA","institution_ids":["https://openalex.org/I26538001"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100656118","display_name":"Bo Liu","orcid":"https://orcid.org/0000-0002-8678-2271"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Liu","raw_affiliation_strings":["School of Computer Science and Information Engineering, Hefei University of Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Information Engineering, Hefei University of Technology, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5103534250"],"corresponding_institution_ids":["https://openalex.org/I158842170"],"apc_list":null,"apc_paid":null,"fwci":1.5448,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.85652748,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"2146","last_page":"2155"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6802910566329956},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6672996878623962},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6351813077926636},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6136990189552307},{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.5604603290557861},{"id":"https://openalex.org/keywords/multi-label-classification","display_name":"Multi-label classification","score":0.465399831533432},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.456390380859375},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4100446105003357},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35455137491226196}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6802910566329956},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6672996878623962},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6351813077926636},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6136990189552307},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.5604603290557861},{"id":"https://openalex.org/C2776482837","wikidata":"https://www.wikidata.org/wiki/Q3553958","display_name":"Multi-label classification","level":2,"score":0.465399831533432},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.456390380859375},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4100446105003357},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35455137491226196},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3664647.3681171","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3681171","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W2108598243","https://openalex.org/W2118978333","https://openalex.org/W2146241755","https://openalex.org/W2183341477","https://openalex.org/W2194775991","https://openalex.org/W2250539671","https://openalex.org/W2440599146","https://openalex.org/W2736688973","https://openalex.org/W2932399282","https://openalex.org/W2962933664","https://openalex.org/W2963351448","https://openalex.org/W2963691377","https://openalex.org/W2963745697","https://openalex.org/W2982112268","https://openalex.org/W3034601242","https://openalex.org/W3035730922","https://openalex.org/W3109067582","https://openalex.org/W3138516171","https://openalex.org/W3167456680","https://openalex.org/W3171625335","https://openalex.org/W3174320978","https://openalex.org/W3174396085","https://openalex.org/W3179096061","https://openalex.org/W3198377975","https://openalex.org/W4214673031","https://openalex.org/W4225922615","https://openalex.org/W4312310776","https://openalex.org/W4366352743","https://openalex.org/W4382450414","https://openalex.org/W4382468523","https://openalex.org/W4386113259","https://openalex.org/W4390873052","https://openalex.org/W4390873546","https://openalex.org/W4391307106"],"related_works":["https://openalex.org/W2039871688","https://openalex.org/W3147584709","https://openalex.org/W2017214274","https://openalex.org/W1600005011","https://openalex.org/W2977677679","https://openalex.org/W4289128054","https://openalex.org/W2883491016","https://openalex.org/W4205999209","https://openalex.org/W2735080633","https://openalex.org/W2565656575"],"abstract_inverted_index":{"Real-world":[0],"data":[1,32],"consistently":[2],"exhibits":[3],"a":[4,46,113],"long-tailed":[5],"distribution,":[6],"often":[7],"spanning":[8],"multiple":[9],"categories.":[10],"This":[11],"complexity":[12],"underscores":[13],"the":[14,78,94,100,107,120,131,135,139,144,147,154,160,177,183,196],"challenge":[15],"of":[16,96,138,146,185,198],"content":[17],"comprehension,":[18],"particularly":[19],"in":[20],"scenarios":[21],"requiring":[22],"Long-Tailed":[23],"Multi-Label":[24],"image":[25],"Classification":[26],"(LTMLC).":[27],"In":[28],"such":[29],"contexts,":[30],"imbalanced":[31],"distribution":[33],"and":[34,48,65,82,102,174,192],"multi-object":[35],"recognition":[36,179],"pose":[37],"significant":[38],"hurdles.":[39],"To":[40,105],"address":[41],"this":[42],"issue,":[43],"we":[44,111,158],"propose":[45],"novel":[47],"effective":[49],"approach":[50],"for":[51,70],"LTMLC,":[52],"termed":[53],"Category-Prompt":[54],"Refined":[55],"Feature":[56],"Learning":[57],"(CPRFL),":[58],"utilizing":[59],"semantic":[60,97],"correlations":[61,98],"between":[62,99],"different":[63],"categories":[64],"decoupling":[66],"category-specific":[67,84,140],"visual":[68,85,90,126,141],"representations":[69,86,142],"each":[71],"category.":[72],"Specifically,":[73],"CPRFL":[74],"initializes":[75],"category-prompts":[76],"from":[77],"pretrained":[79],"CLIP's":[80],"embeddings":[81],"decouples":[83],"through":[87],"interaction":[88],"with":[89],"features,":[91],"thereby":[92],"facilitating":[93],"establishment":[95],"head":[101],"tail":[103],"classes.":[104],"mitigate":[106],"visual-semantic":[108],"domain":[109],"bias,":[110],"design":[112],"progressive":[114,136],"Dual-Path":[115],"Back-Propagation":[116],"mechanism":[117],"to":[118,167],"refine":[119],"prompts":[121],"by":[122],"progressively":[123],"incorporating":[124],"context-related":[125],"information":[127],"into":[128,152],"prompts.":[129,149],"Simultaneously,":[130],"refinement":[132],"process":[133],"facilitates":[134],"purification":[137],"under":[143],"guidance":[145],"refined":[148],"Furthermore,":[150],"taking":[151],"account":[153],"negative-positive":[155],"sample":[156],"imbalance,":[157],"adopt":[159],"Asymmetric":[161],"Loss":[162],"as":[163],"our":[164,186,199],"optimization":[165],"objective":[166],"suppress":[168],"negative":[169],"samples":[170],"across":[171],"all":[172],"classes":[173],"potentially":[175],"enhance":[176],"head-to-tail":[178],"performance.":[180],"We":[181],"validate":[182],"effectiveness":[184],"method":[187],"on":[188],"two":[189],"LTMLC":[190],"benchmarks":[191],"extensive":[193],"experiments":[194],"demonstrate":[195],"superiority":[197],"work":[200],"over":[201],"baselines.The":[202],"code":[203],"is":[204],"available":[205],"at":[206],"https://github.com/jiexuanyan/CPRFL.":[207]},"counts_by_year":[{"year":2025,"cited_by_count":4}],"updated_date":"2025-12-21T23:12:01.093139","created_date":"2025-10-10T00:00:00"}
