{"id":"https://openalex.org/W4399418657","doi":"https://doi.org/10.1145/3651671.3651674","title":"Multi-modal Contextual Prompt Learning for Multi-label Classification with Partial Labels","display_name":"Multi-modal Contextual Prompt Learning for Multi-label Classification with Partial Labels","publication_year":2024,"publication_date":"2024-02-02","ids":{"openalex":"https://openalex.org/W4399418657","doi":"https://doi.org/10.1145/3651671.3651674"},"language":"en","primary_location":{"id":"doi:10.1145/3651671.3651674","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3651671.3651674","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 16th International Conference on Machine Learning and Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092516477","display_name":"Rui Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I1328775524","display_name":"Zhejiang Sci-Tech University","ror":"https://ror.org/03893we55","country_code":"CN","type":"education","lineage":["https://openalex.org/I1328775524"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Rui Wang","raw_affiliation_strings":["School of Computer Science and Technology, Zhejiang Sci-Tech University, China"],"raw_orcid":"https://orcid.org/0009-0002-6027-1091","affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Zhejiang Sci-Tech University, China","institution_ids":["https://openalex.org/I1328775524"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005961599","display_name":"Zhengxin Pan","orcid":"https://orcid.org/0000-0003-2003-0728"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhengxin Pan","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, China"],"raw_orcid":"https://orcid.org/0000-0003-2003-0728","affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, China","institution_ids":["https://openalex.org/I168879160"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026986847","display_name":"Fangyu Wu","orcid":"https://orcid.org/0000-0001-9618-8965"},"institutions":[{"id":"https://openalex.org/I69356397","display_name":"Xi\u2019an Jiaotong-Liverpool University","ror":"https://ror.org/03zmrmn05","country_code":"CN","type":"education","lineage":["https://openalex.org/I69356397"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fangyu Wu","raw_affiliation_strings":["School of Advanced Technology, Xi'an-Jiaotong Liverpool University, China"],"raw_orcid":"https://orcid.org/0000-0001-9618-8965","affiliations":[{"raw_affiliation_string":"School of Advanced Technology, Xi'an-Jiaotong Liverpool University, China","institution_ids":["https://openalex.org/I69356397"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113242654","display_name":"Yifan Lv","orcid":null},"institutions":[{"id":"https://openalex.org/I159389169","display_name":"Ningbo University of Technology","ror":"https://ror.org/037dym702","country_code":"CN","type":"education","lineage":["https://openalex.org/I159389169"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yifan Lv","raw_affiliation_strings":["School of Computing and Data Engineering, NingboTech University, China"],"raw_orcid":"https://orcid.org/0000-0002-8045-9932","affiliations":[{"raw_affiliation_string":"School of Computing and Data Engineering, NingboTech University, China","institution_ids":["https://openalex.org/I159389169"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101991543","display_name":"Bailing Zhang","orcid":"https://orcid.org/0000-0001-5762-5763"},"institutions":[{"id":"https://openalex.org/I159389169","display_name":"Ningbo University of Technology","ror":"https://ror.org/037dym702","country_code":"CN","type":"education","lineage":["https://openalex.org/I159389169"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bailing Zhang","raw_affiliation_strings":["School of Computing and Data Engineering, NingboTech University, China"],"raw_orcid":"https://orcid.org/0000-0001-5762-5763","affiliations":[{"raw_affiliation_string":"School of Computing and Data Engineering, NingboTech University, China","institution_ids":["https://openalex.org/I159389169"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5092516477"],"corresponding_institution_ids":["https://openalex.org/I1328775524"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.06234195,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"517","last_page":"524"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.831356406211853},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.611513614654541},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6103826761245728},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.563865602016449},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5612573027610779},{"id":"https://openalex.org/keywords/multi-label-classification","display_name":"Multi-label classification","score":0.531419038772583},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5185573697090149},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.44241276383399963},{"id":"https://openalex.org/keywords/contextual-image-classification","display_name":"Contextual image classification","score":0.4222835898399353},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.39886072278022766},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3729533851146698}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.831356406211853},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.611513614654541},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6103826761245728},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.563865602016449},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5612573027610779},{"id":"https://openalex.org/C2776482837","wikidata":"https://www.wikidata.org/wiki/Q3553958","display_name":"Multi-label classification","level":2,"score":0.531419038772583},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5185573697090149},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.44241276383399963},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.4222835898399353},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.39886072278022766},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3729533851146698},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3651671.3651674","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3651671.3651674","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 16th International Conference on Machine Learning and Computing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W12165144","https://openalex.org/W1861492603","https://openalex.org/W1996953927","https://openalex.org/W2001481583","https://openalex.org/W2031489346","https://openalex.org/W2108598243","https://openalex.org/W2146241755","https://openalex.org/W2194775991","https://openalex.org/W2549365021","https://openalex.org/W2867270703","https://openalex.org/W2932399282","https://openalex.org/W2963300078","https://openalex.org/W2963676620","https://openalex.org/W2963703197","https://openalex.org/W2963745697","https://openalex.org/W2969792713","https://openalex.org/W2982112268","https://openalex.org/W2998420437","https://openalex.org/W3034689791","https://openalex.org/W3034978279","https://openalex.org/W3045700442","https://openalex.org/W3087020912","https://openalex.org/W3089555680","https://openalex.org/W3135367836","https://openalex.org/W3138516171","https://openalex.org/W3165691894","https://openalex.org/W3198377975","https://openalex.org/W4214673031","https://openalex.org/W4225930680","https://openalex.org/W4226342448","https://openalex.org/W4229453513","https://openalex.org/W4283313485","https://openalex.org/W4312310776","https://openalex.org/W4312420092","https://openalex.org/W4312648273"],"related_works":["https://openalex.org/W17155033","https://openalex.org/W3207760230","https://openalex.org/W1496222301","https://openalex.org/W1590307681","https://openalex.org/W2536018345","https://openalex.org/W4312814274","https://openalex.org/W4285370786","https://openalex.org/W4205999209","https://openalex.org/W2735080633","https://openalex.org/W4387801808"],"abstract_inverted_index":{"Multi-label":[0],"classification":[1,26,104],"is":[2],"a":[3,43,74],"task":[4],"with":[5,27,109],"diverse":[6],"applications,":[7],"but":[8],"current":[9],"algorithms":[10],"heavily":[11],"rely":[12],"on":[13,73,135],"accurately":[14],"labeled":[15,90],"data,":[16],"leading":[17],"to":[18,59,92,118],"time-consuming":[19],"and":[20,51,89,123,138,144],"labor-intensive":[21],"data":[22],"collection.":[23],"However,":[24],"multi-label":[25,103],"partial":[28,110],"labels":[29],"presents":[30],"significant":[31],"challenges.":[32],"In":[33],"this":[34],"study,":[35],"we":[36],"propose":[37],"Multi-modal":[38],"Contextual":[39],"Prompt":[40],"Learning":[41],"(MCPL),":[42],"novel":[44],"approach":[45],"that":[46],"leverages":[47],"large-scale":[48],"visual-language":[49],"models":[50],"exploits":[52],"the":[53,61,68,95,115,120,125,129,136],"strong":[54],"image-text":[55,78],"alignment":[56],"in":[57,86,101],"CLIP":[58],"address":[60],"scarcity":[62],"of":[63,77,128],"label":[64],"annotations.":[65],"We":[66,80,112],"pre-train":[67],"visual":[69],"language":[70],"model\u2019s":[71],"encoder":[72],"large":[75],"number":[76],"pairs.":[79],"introduce":[81],"multi-modal":[82],"contextual":[83],"prompt":[84],"learning":[85],"both":[87],"images":[88],"text":[91],"better":[93],"utilize":[94],"image-label":[96],"correspondence":[97],"within":[98],"CLIP,":[99],"resulting":[100],"enhanced":[102],"performance,":[105],"even":[106],"when":[107],"faced":[108],"labels.":[111],"also":[113],"use":[114],"coupling":[116],"function":[117],"couple":[119],"two":[121,130],"modes":[122],"realize":[124],"interactive":[126],"connection":[127],"modal":[131],"prompts.":[132],"Extensive":[133],"experiments":[134],"MS-COCO":[137],"VOC2007":[139],"datasets,":[140],"demonstrating":[141],"its":[142],"superiority":[143],"achieving":[145],"competitive":[146],"performance.":[147]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
