{"id":"https://openalex.org/W4403582528","doi":"https://doi.org/10.1145/3627673.3679852","title":"M <sup>2</sup> ConceptBase: A Fine-Grained Aligned Concept-Centric Multimodal Knowledge Base","display_name":"M <sup>2</sup> ConceptBase: A Fine-Grained Aligned Concept-Centric Multimodal Knowledge Base","publication_year":2024,"publication_date":"2024-10-20","ids":{"openalex":"https://openalex.org/W4403582528","doi":"https://doi.org/10.1145/3627673.3679852"},"language":"en","primary_location":{"id":"doi:10.1145/3627673.3679852","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3627673.3679852","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056837500","display_name":"Zhiwei Zha","orcid":"https://orcid.org/0009-0002-7005-0372"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiwei Zha","raw_affiliation_strings":["Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062115445","display_name":"Jiaan Wang","orcid":"https://orcid.org/0000-0002-2587-7648"},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaan Wang","raw_affiliation_strings":["School of Computer Science and Technology, Soochow University, Suzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Soochow University, Suzhou, China","institution_ids":["https://openalex.org/I3923682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065529268","display_name":"Zhixu Li","orcid":"https://orcid.org/0000-0003-2355-288X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhixu Li","raw_affiliation_strings":["Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041560675","display_name":"Xiangru Zhu","orcid":"https://orcid.org/0000-0001-7308-3642"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangru Zhu","raw_affiliation_strings":["Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074371475","display_name":"Wei Song","orcid":"https://orcid.org/0000-0002-0828-7486"},"institutions":[{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Song","raw_affiliation_strings":["Research Center for Intelligent Robotics, Zhejiang Lab, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Research Center for Intelligent Robotics, Zhejiang Lab, Hangzhou, China","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090455375","display_name":"Yanghua Xiao","orcid":"https://orcid.org/0000-0001-8403-9591"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanghua Xiao","raw_affiliation_strings":["Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Data Science, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5056837500"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":0.2493,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.54208865,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"3113","last_page":"3123"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6187741160392761},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.5535401701927185},{"id":"https://openalex.org/keywords/base","display_name":"Base (topology)","score":0.41131591796875},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.19825071096420288}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6187741160392761},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.5535401701927185},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.41131591796875},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.19825071096420288},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3627673.3679852","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3627673.3679852","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1964763677","https://openalex.org/W2117539524","https://openalex.org/W2277195237","https://openalex.org/W2560730294","https://openalex.org/W2582830023","https://openalex.org/W2615399484","https://openalex.org/W2947312908","https://openalex.org/W2963870853","https://openalex.org/W3037575487","https://openalex.org/W3171908007","https://openalex.org/W3173220247","https://openalex.org/W3173909648","https://openalex.org/W3199693760","https://openalex.org/W4210493972","https://openalex.org/W4226076338","https://openalex.org/W4230405732","https://openalex.org/W4285294723","https://openalex.org/W4307079201","https://openalex.org/W4385568053","https://openalex.org/W4386065508","https://openalex.org/W4386075723","https://openalex.org/W4391407054","https://openalex.org/W6847076894"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2385713529","https://openalex.org/W2599749361"],"abstract_inverted_index":{"Multimodal":[0],"knowledge":[1,7,25],"bases":[2],"(MMKBs)":[3],"provide":[4],"cross-modal":[5],"aligned":[6],"crucial":[8],"for":[9,21,41],"multimodal":[10,48,78,159],"tasks.":[11],"However,":[12],"the":[13,42,57,145,153],"images":[14,69,96,110],"in":[15,23,166],"existing":[16],"MMKBs":[17],"are":[18,36,39],"generally":[19],"collected":[20],"entities":[22],"encyclopedia":[24],"graphs.":[26],"Therefore,":[27],"detailed":[28,71],"groundings":[29],"of":[30,47,108,158],"visual":[31,43,117],"semantics":[32],"with":[33,67],"linguistic":[34],"concepts":[35,64],"lacking,":[37],"which":[38],"essential":[40],"concept":[44,104,155],"cognition":[45],"ability":[46],"models.":[49],"Addressing":[50],"this":[51],"gap,":[52],"we":[53],"introduce":[54],"M2":[55,61,100,137,148],"ConceptBase,":[56],"first":[58],"concept-centric":[59],"MMKB.":[60],"ConceptBase":[62,101,138,149],"models":[63,162],"as":[65],"nodes":[66],"associated":[68],"and":[70,85,97,111,118],"textual":[72,119],"descriptions.":[73],"We":[74],"propose":[75],"a":[76,112],"context-aware":[77],"symbol":[79],"grounding":[80],"approach":[81],"to":[82,105],"align":[83],"concept-image":[84],"concept-description":[86],"pairs":[87],"using":[88],"context":[89],"information":[90],"from":[91],"image-text":[92],"datasets.":[93],"Comprising":[94],"951K":[95],"152K":[98],"concepts,":[99],"links":[102],"each":[103],"an":[106],"average":[107],"6.27":[109],"single":[113],"description,":[114],"ensuring":[115],"comprehensive":[116],"semantics.":[120],"Human":[121],"studies":[122],"confirm":[123],"more":[124],"than":[125],"95%":[126],"alignment":[127],"accuracy,":[128],"underscoring":[129],"its":[130,171],"quality.":[131],"Additionally,":[132],"our":[133],"experiments":[134],"demonstrate":[135],"that":[136],"significantly":[139],"enhances":[140],"VQA":[141],"model":[142],"performance":[143],"on":[144],"OK-VQA":[146],"task.":[147],"also":[150],"substantially":[151],"improves":[152],"fine-grained":[154],"understanding":[156],"capabilities":[157],"large":[160],"language":[161],"through":[163],"retrieval":[164],"augmentation":[165],"two":[167],"concept-related":[168],"tasks,":[169],"highlighting":[170],"value.":[172]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
