{"id":"https://openalex.org/W4414321943","doi":"https://doi.org/10.1109/tip.2025.3609185","title":"Dual-View Alignment Learning With Hierarchical-Prompt for Class-Imbalance Multi-Label Image Classification","display_name":"Dual-View Alignment Learning With Hierarchical-Prompt for Class-Imbalance Multi-Label Image Classification","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4414321943","doi":"https://doi.org/10.1109/tip.2025.3609185","pmid":"https://pubmed.ncbi.nlm.nih.gov/40966154"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2025.3609185","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2025.3609185","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052560070","display_name":"Sheng Huang","orcid":"https://orcid.org/0000-0001-5610-0826"},"institutions":[{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"government","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]},{"id":"https://openalex.org/I4210094876","display_name":"Ministry of Education","ror":"https://ror.org/00q919b81","country_code":"SA","type":"government","lineage":["https://openalex.org/I4210094876"]}],"countries":["CN","SA"],"is_corresponding":true,"raw_author_name":"Sheng Huang","raw_affiliation_strings":["Key Laboratory of Dependable Service Computing in Cyber Physical Society, Ministry of Education, Chongqing University, Chongqing, Chongqing, China","Key Laboratory of Dependable Service Computing in Cyber Physical Society, Ministry of Education, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Dependable Service Computing in Cyber Physical Society, Ministry of Education, Chongqing University, Chongqing, Chongqing, China","institution_ids":["https://openalex.org/I4210094876"]},{"raw_affiliation_string":"Key Laboratory of Dependable Service Computing in Cyber Physical Society, Ministry of Education, Chongqing, China","institution_ids":["https://openalex.org/I1327237609"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103534250","display_name":"Jiexuan Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiexuan Yan","raw_affiliation_strings":["School of Big Data and Software Engineering, Chongqing University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"School of Big Data and Software Engineering, Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066647707","display_name":"Beiyan Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]},{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Beiyan Liu","raw_affiliation_strings":["School of Big Data and Software Engineering, Chongqing University, Chongqing, China","School of Computer Science and Information Engineering, Hefei University of Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Big Data and Software Engineering, Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]},{"raw_affiliation_string":"School of Computer Science and Information Engineering, Hefei University of Technology, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100656118","display_name":"Bo Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]},{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Liu","raw_affiliation_strings":["School of Big Data and Software Engineering, Chongqing University, Chongqing, China","School of Computer Science and Information Engineering, Hefei University of Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Big Data and Software Engineering, Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]},{"raw_affiliation_string":"School of Computer Science and Information Engineering, Hefei University of Technology, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051332325","display_name":"Richang Hong","orcid":"https://orcid.org/0000-0001-5461-3986"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Richang Hong","raw_affiliation_strings":["School of Computer Science and Information Engineering, Hefei University of Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Information Engineering, Hefei University of Technology, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5052560070"],"corresponding_institution_ids":["https://openalex.org/I1327237609","https://openalex.org/I4210094876"],"apc_list":null,"apc_paid":null,"fwci":2.3568,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.9109335,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"34","issue":null,"first_page":"5989","last_page":"6001"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9470000267028809,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9470000267028809,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.6403999924659729},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6373999714851379},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5616999864578247},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5160999894142151},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5033000111579895},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4878999888896942},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4851999878883362},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.4794999957084656}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7718999981880188},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7516000270843506},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.6403999924659729},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6373999714851379},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5616999864578247},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5160999894142151},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5033000111579895},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4878999888896942},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4851999878883362},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.4794999957084656},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4715999960899353},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4124000072479248},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.41200000047683716},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.3122999966144562},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.29649999737739563},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2903999984264374},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.28679999709129333},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.28459998965263367},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.28450000286102295},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2833000123500824},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.2791000008583069},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.2718000113964081},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2680000066757202},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.2515000104904175}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2025.3609185","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2025.3609185","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:40966154","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40966154","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1585896628","display_name":null,"funder_award_id":"62176030","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7432550059","display_name":null,"funder_award_id":"2023CDJYGRH-YB18","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Real-world":[0],"datasets":[1],"often":[2],"exhibit":[3],"class":[4],"imbalance":[5,29],"across":[6],"multiple":[7],"categories,":[8],"manifesting":[9],"as":[10],"long-tailed":[11,179],"distributions":[12],"and":[13,30,111,117,156,175,184,186],"few-shot":[14,191],"scenarios.":[15],"This":[16],"is":[17,149],"especially":[18],"challenging":[19],"in":[20,67,141],"Class-Imbalanced":[21],"Multi-Label":[22],"Image":[23],"Classification":[24],"(CI-MLIC)":[25],"tasks,":[26,101],"where":[27],"data":[28],"multi-object":[31],"recognition":[32],"present":[33],"significant":[34],"obstacles.":[35],"To":[36,94],"address":[37],"these":[38],"challenges,":[39],"we":[40,102,122],"propose":[41],"a":[42,104,124],"novel":[43],"method":[44,166],"termed":[45],"Dual-View":[46],"Alignment":[47],"Learning":[48],"with":[49],"Hierarchical":[50],"Prompt":[51],"(HP-DVAL),":[52],"which":[53],"leverages":[54],"multi-modal":[55],"knowledge":[56,139],"from":[57,83,135,137],"vision-language":[58],"pretrained":[59],"(VLP)":[60],"models":[61,85,98],"to":[62,76,114,131],"mitigate":[63],"the":[64,78,162,178,189],"class-imbalance":[65],"problem":[66],"multi-label":[68,180,190],"settings.":[69],"Specifically,":[70],"HP-DVAL":[71],"employs":[72],"dual-view":[73],"alignment":[74],"learning":[75],"transfer":[77],"powerful":[79],"feature":[80],"representation":[81],"capabilities":[82],"VLP":[84,97,142],"by":[86],"extracting":[87],"complementary":[88],"features":[89],"for":[90,99],"accurate":[91],"image-text":[92],"alignment.":[93],"better":[95],"adapt":[96],"CI-MLIC":[100,153],"introduce":[103],"hierarchical":[105],"prompt-tuning":[106],"strategy":[107],"that":[108],"utilizes":[109],"global":[110],"local":[112],"prompts":[113,134],"learn":[115],"task-specific":[116],"context-related":[118],"prior":[119],"knowledge.":[120],"Additionally,":[121],"design":[123],"semantic":[125],"consistency":[126],"loss":[127],"during":[128],"prompt":[129],"tuning":[130],"prevent":[132],"learned":[133],"deviating":[136],"general":[138],"embedded":[140],"models.":[143],"The":[144],"effectiveness":[145],"of":[146,164,173],"our":[147,165],"approach":[148],"validated":[150],"on":[151,177,188],"two":[152],"benchmarks:":[154],"MS-COCO":[155],"VOC2007.":[157],"Extensive":[158],"experimental":[159],"results":[160],"demonstrate":[161],"superiority":[163],"over":[167],"SOTA":[168],"approaches,":[169],"achieving":[170],"mAP":[171],"improvements":[172],"10.0%":[174],"5.2%":[176],"image":[181,192],"classification":[182,193],"task,":[183],"6.8%":[185],"2.9%":[187],"task.":[194]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
