{"id":"https://openalex.org/W4405706077","doi":"https://doi.org/10.1145/3708991","title":"Learning Semantic-aware Representation in Visual-Language Models for Multi-label Recognition with Partial Labels","display_name":"Learning Semantic-aware Representation in Visual-Language Models for Multi-label Recognition with Partial Labels","publication_year":2024,"publication_date":"2024-12-23","ids":{"openalex":"https://openalex.org/W4405706077","doi":"https://doi.org/10.1145/3708991"},"language":"en","primary_location":{"id":"doi:10.1145/3708991","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3708991","pdf_url":null,"source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5115612477","display_name":"Haoxian Ruan","orcid":null},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haoxian Ruan","raw_affiliation_strings":["Guangdong University of Technology, Guangzhou, China","Guangdong University of Technology, China"],"affiliations":[{"raw_affiliation_string":"Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]},{"raw_affiliation_string":"Guangdong University of Technology, China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058542486","display_name":"Zhihua Xu","orcid":"https://orcid.org/0000-0002-0731-4585"},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhihua Xu","raw_affiliation_strings":["Guangdong University of Technology, Guangzhou, China","Guangdong University of Technology, China"],"affiliations":[{"raw_affiliation_string":"Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]},{"raw_affiliation_string":"Guangdong University of Technology, China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064465418","display_name":"Zhijing Yang","orcid":"https://orcid.org/0000-0001-8336-5109"},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhijing Yang","raw_affiliation_strings":["Information Engineering, Guangdong University of Technology, Guangzhou, China","Guangdong University of Technology, China"],"affiliations":[{"raw_affiliation_string":"Information Engineering, Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]},{"raw_affiliation_string":"Guangdong University of Technology, China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081352580","display_name":"Yongyi Lu","orcid":"https://orcid.org/0000-0003-1398-9965"},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongyi Lu","raw_affiliation_strings":["Guangdong University of Technology, Guangzhou, China","Guangdong University of Technology, China"],"affiliations":[{"raw_affiliation_string":"Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]},{"raw_affiliation_string":"Guangdong University of Technology, China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091494473","display_name":"Jinghui Qin","orcid":"https://orcid.org/0000-0003-0663-199X"},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinghui Qin","raw_affiliation_strings":["Information Engineering, Guangdong University of Technology, Guangzhou, China","Guangdong University of Technology, China"],"affiliations":[{"raw_affiliation_string":"Information Engineering, Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]},{"raw_affiliation_string":"Guangdong University of Technology, China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052027147","display_name":"Tianshui Chen","orcid":"https://orcid.org/0000-0002-5848-5624"},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianshui Chen","raw_affiliation_strings":["Information Engineering, Guangdong University of Technology, Guangzhou, China","Guangdong University of Technology, China"],"affiliations":[{"raw_affiliation_string":"Information Engineering, Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]},{"raw_affiliation_string":"Guangdong University of Technology, China","institution_ids":["https://openalex.org/I139024713"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5115612477"],"corresponding_institution_ids":["https://openalex.org/I139024713"],"apc_list":null,"apc_paid":null,"fwci":1.3503,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.85029071,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"21","issue":"3","first_page":"1","last_page":"19"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9894000291824341,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9159127473831177},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6690595149993896},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6069383025169373},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5125296115875244},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3642094135284424}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9159127473831177},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6690595149993896},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6069383025169373},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5125296115875244},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3642094135284424},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3708991","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3708991","pdf_url":null,"source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5199999809265137}],"awards":[{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1477544716","display_name":null,"funder_award_id":"Guangdong","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1709975844","display_name":null,"funder_award_id":"2022A1515011","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3753994725","display_name":null,"funder_award_id":"2023A1515012568","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4020255992","display_name":null,"funder_award_id":"Project","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4413561973","display_name":null,"funder_award_id":"2023A15150","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G4488680036","display_name":null,"funder_award_id":"2022A15","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4871260389","display_name":null,"funder_award_id":"2023A151","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G5248781783","display_name":null,"funder_award_id":"2022A1515011555","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G5354582882","display_name":null,"funder_award_id":"51501155","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5543444180","display_name":null,"funder_award_id":"62206314","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5743616050","display_name":null,"funder_award_id":"2024A","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G5760752404","display_name":null,"funder_award_id":"Projects","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7012638997","display_name":null,"funder_award_id":"2023A","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G7242000173","display_name":null,"funder_award_id":"62206060","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7726157001","display_name":null,"funder_award_id":"Grant No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8863666567","display_name":null,"funder_award_id":"and No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321921","display_name":"Natural Science Foundation of Guangdong Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W12165144","https://openalex.org/W1861492603","https://openalex.org/W1996953927","https://openalex.org/W2001481583","https://openalex.org/W2031489346","https://openalex.org/W2064675550","https://openalex.org/W2082762663","https://openalex.org/W2194775991","https://openalex.org/W2250539671","https://openalex.org/W2296447001","https://openalex.org/W2932399282","https://openalex.org/W2944205764","https://openalex.org/W2963300078","https://openalex.org/W2963676620","https://openalex.org/W2963745697","https://openalex.org/W2969792713","https://openalex.org/W3034689791","https://openalex.org/W3087020912","https://openalex.org/W3089555680","https://openalex.org/W3198377975","https://openalex.org/W3206041168","https://openalex.org/W3216466215","https://openalex.org/W4214673031","https://openalex.org/W4220818090","https://openalex.org/W4221079634","https://openalex.org/W4225930680","https://openalex.org/W4226179686","https://openalex.org/W4226342448","https://openalex.org/W4229453513","https://openalex.org/W4240153047","https://openalex.org/W4281491955","https://openalex.org/W4286499389","https://openalex.org/W4308104970","https://openalex.org/W4312310776","https://openalex.org/W4312563428","https://openalex.org/W4312648273","https://openalex.org/W4312651322","https://openalex.org/W4312747482","https://openalex.org/W4313331808","https://openalex.org/W4382450414","https://openalex.org/W4386071614","https://openalex.org/W4386113239","https://openalex.org/W4388543952","https://openalex.org/W4392130563"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Multi-label":[0],"recognition":[1],"with":[2,144,182],"partial":[3],"labels":[4,10],"(MLR-PL),":[5],"in":[6,24,36,53,68,78,108],"which":[7,155],"only":[8],"some":[9],"are":[11,15],"known":[12],"while":[13],"others":[14],"unknown":[16],"for":[17,86],"each":[18,151],"image,":[19],"is":[20,34,137,153],"a":[21,98,103,183],"practical":[22],"task":[23,70],"computer":[25],"vision,":[26],"since":[27],"collecting":[28],"large-scale":[29],"and":[30,83,102,167,200],"complete":[31],"multi-label":[32],"datasets":[33,171],"difficult":[35],"real":[37],"application":[38],"scenarios.":[39],"Recently,":[40],"vision":[41],"language":[42],"models":[43],"(e.g.,":[44],"CLIP)":[45],"have":[46],"demonstrated":[47],"impressive":[48],"transferability":[49],"to":[50,72,139,205],"downstream":[51],"tasks":[52],"data":[54],"limited":[55,58],"or":[56],"label":[57],"settings.":[59],"However,":[60],"current":[61,179],"CLIP-based":[62,109,206],"methods":[63,181],"suffer":[64],"from":[65,197],"semantic":[66,99,113,158],"confusion":[67,159],"MLR":[69],"due":[71],"the":[73,79,112,117,126,132,148,157,174],"lack":[74],"of":[75,150],"fine-grained":[76],"information":[77,196],"single":[80],"global":[81],"visual":[82,118,188],"textual":[84],"representation":[85],"all":[87],"categories.":[88],"In":[89],"this":[90,94],"work,":[91],"we":[92],"address":[93],"problem":[95],"by":[96,124],"introducing":[97],"decoupling":[100,114],"module":[101,115],"category-specific":[104,121,133],"prompt":[105,134],"optimization":[106,135],"method":[107,136,193],"framework.":[110],"Specifically,":[111],"following":[116],"encoder":[119],"learns":[120],"feature":[122],"maps":[123],"utilizing":[125],"semantic-guided":[127],"spatial":[128],"attention":[129],"mechanism.":[130],"Moreover,":[131],"introduced":[138],"learn":[140],"text":[141],"representations":[142],"aligned":[143],"category":[145,152],"semantics.":[146],"Therefore,":[147],"prediction":[149],"independent,":[154],"alleviate":[156],"problem.":[160],"Extensive":[161],"experiments":[162],"on":[163],"Microsoft":[164],"COCO":[165],"2014":[166],"Pascal":[168],"VOC":[169],"2007":[170],"demonstrate":[172],"that":[173,191],"proposed":[175],"framework":[176],"significantly":[177],"outperforms":[178],"state-of-art":[180],"simpler":[184],"model":[185],"structure.":[186],"Additionally,":[187],"analysis":[189],"shows":[190],"our":[192],"effectively":[194],"separates":[195],"different":[198],"categories":[199],"achieves":[201],"better":[202],"performance":[203],"compared":[204],"baseline":[207],"method.":[208]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3}],"updated_date":"2026-04-15T08:11:43.952461","created_date":"2025-10-10T00:00:00"}
