{"id":"https://openalex.org/W3200159660","doi":"https://doi.org/10.1109/ijcnn52387.2021.9534428","title":"Multi-Modal Multi-Instance Multi-Label Learning with Graph Convolutional Network","display_name":"Multi-Modal Multi-Instance Multi-Label Learning with Graph Convolutional Network","publication_year":2021,"publication_date":"2021-07-18","ids":{"openalex":"https://openalex.org/W3200159660","doi":"https://doi.org/10.1109/ijcnn52387.2021.9534428","mag":"3200159660"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn52387.2021.9534428","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9534428","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110680372","display_name":"Cheng Hang","orcid":null},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Cheng Hang","raw_affiliation_strings":["State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100391855","display_name":"Wei Wang","orcid":"https://orcid.org/0000-0002-0707-8076"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Wang","raw_affiliation_strings":["State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073912249","display_name":"De\u2010Chuan Zhan","orcid":"https://orcid.org/0000-0002-3533-2078"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"De-Chuan Zhan","raw_affiliation_strings":["State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory for Novel Software Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110680372"],"corresponding_institution_ids":["https://openalex.org/I881766915"],"apc_list":null,"apc_paid":null,"fwci":0.2719,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.63436921,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":"10","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8178195953369141},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6328245401382446},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5800186991691589},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5314100384712219},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5122575163841248},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5110355615615845},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.4576820433139801},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.357942670583725},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.22661080956459045}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8178195953369141},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6328245401382446},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5800186991691589},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5314100384712219},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5122575163841248},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5110355615615845},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.4576820433139801},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.357942670583725},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.22661080956459045},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn52387.2021.9534428","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9534428","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W125678093","https://openalex.org/W562660536","https://openalex.org/W639708223","https://openalex.org/W1523738436","https://openalex.org/W1900086069","https://openalex.org/W1996462768","https://openalex.org/W1999954155","https://openalex.org/W2047221353","https://openalex.org/W2050826493","https://openalex.org/W2052684427","https://openalex.org/W2079221635","https://openalex.org/W2121625657","https://openalex.org/W2126250169","https://openalex.org/W2133288557","https://openalex.org/W2134604967","https://openalex.org/W2156935079","https://openalex.org/W2176228818","https://openalex.org/W2183087644","https://openalex.org/W2293549417","https://openalex.org/W2584931758","https://openalex.org/W2613718673","https://openalex.org/W2785934082","https://openalex.org/W2808958151","https://openalex.org/W2932399282","https://openalex.org/W2962767366","https://openalex.org/W2964015378","https://openalex.org/W2964069537","https://openalex.org/W4294558607","https://openalex.org/W6605125263","https://openalex.org/W6615672858","https://openalex.org/W6620707391","https://openalex.org/W6631340511","https://openalex.org/W6663358622","https://openalex.org/W6670567483","https://openalex.org/W6679066655","https://openalex.org/W6685347822","https://openalex.org/W6685974025","https://openalex.org/W6696941056","https://openalex.org/W6726873649","https://openalex.org/W6736095516","https://openalex.org/W6738964360","https://openalex.org/W6747701563"],"related_works":["https://openalex.org/W2378211422","https://openalex.org/W2745001401","https://openalex.org/W4321353415","https://openalex.org/W2130974462","https://openalex.org/W972276598","https://openalex.org/W4246352526","https://openalex.org/W2028665553","https://openalex.org/W2086519370","https://openalex.org/W2087343574","https://openalex.org/W2121910908"],"abstract_inverted_index":{"When":[0],"applying":[1],"machine":[2],"learning":[3,83,90],"to":[4,11,137,163],"tackle":[5],"realworld":[6],"problems,":[7],"it":[8,56,156,160,188],"is":[9,57,96,116,124,136,150,189],"common":[10],"see":[12],"that":[13,92,103,194],"objects":[14,27],"come":[15],"with":[16,73],"multiple":[17,32,69],"labels":[18,120],"rather":[19],"than":[20],"a":[21,35,53,114],"single":[22],"label.":[23],"In":[24,98],"addition,":[25],"complex":[26],"can":[28,105],"be":[29],"composed":[30],"of":[31,184],"modalities,":[33],"e.g.":[34],"post":[36,66],"on":[37,152,174],"social":[38],"media":[39],"may":[40,67],"contain":[41,68],"both":[42,175],"texts":[43,72],"and":[44,71,121,178,187],"images.":[45],"Previous":[46,86],"approaches":[47],"typically":[48],"treat":[49],"every":[50,65],"modality":[51],"as":[52,64],"whole,":[54],"while":[55],"not":[58],"the":[59,168,182,195],"case":[60],"in":[61,191,197],"real":[62],"world,":[63],"images":[70],"quite":[74],"diverse":[75],"semantic":[76],"meanings.":[77],"Therefore,":[78],"Multi-modal":[79],"Multi-instance":[80],"Multi-label":[81],"(M3)":[82],"was":[84],"proposed.":[85],"attempt":[87],"at":[88],"M3":[89,107],"argues":[91],"exploiting":[93],"label":[94,123,140,145],"correlations":[95],"crucial.":[97],"this":[99],"paper,":[100],"we":[101,104],"find":[102],"handle":[106],"problems":[108],"using":[109],"graph":[110,115],"convolutional":[111],"network.":[112],"Specifically,":[113],"built":[117],"over":[118],"all":[119],"each":[122],"initially":[125],"represented":[126],"by":[127],"its":[128],"word":[129],"embedding.":[130],"The":[131],"main":[132],"goal":[133],"for":[134],"GCN":[135],"map":[138],"those":[139],"embed":[141],"dings":[142],"into":[143],"inter-correlated":[144],"classifiers.":[146],"Moreover,":[147],"multi-instance":[148],"aggregation":[149],"based":[151],"attention":[153],"mechanism,":[154],"making":[155],"more":[157],"interpretable":[158],"because":[159],"naturally":[161],"learns":[162],"discover":[164],"which":[165],"pattern":[166],"triggers":[167],"labels.":[169],"Empirical":[170],"studies":[171,193],"are":[172,200],"conducted":[173],"benchmark":[176],"datasets":[177],"industrial":[179],"datasets,":[180],"validating":[181],"effectiveness":[183],"our":[185,198],"method,":[186],"demonstrated":[190],"ablation":[192],"components":[196],"methods":[199],"essential.":[201]},"counts_by_year":[{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
