{"id":"https://openalex.org/W4304080188","doi":"https://doi.org/10.1145/3503161.3548195","title":"Cross-Modal Retrieval with Heterogeneous Graph Embedding","display_name":"Cross-Modal Retrieval with Heterogeneous Graph Embedding","publication_year":2022,"publication_date":"2022-10-10","ids":{"openalex":"https://openalex.org/W4304080188","doi":"https://doi.org/10.1145/3503161.3548195"},"language":"en","primary_location":{"id":"doi:10.1145/3503161.3548195","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3503161.3548195","pdf_url":null,"source":{"id":"https://openalex.org/S4363608757","display_name":"Proceedings of the 30th ACM International Conference on Multimedia","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100723410","display_name":"Dapeng Chen","orcid":"https://orcid.org/0000-0003-2490-1703"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Dapeng Chen","raw_affiliation_strings":["Huawei Technologies Ltd, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Ltd, Shenzhen, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100340979","display_name":"Min Wang","orcid":"https://orcid.org/0000-0003-3048-6980"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Min Wang","raw_affiliation_strings":["Huawei Technologies Ltd, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Ltd, Shenzhen, China","institution_ids":["https://openalex.org/I2250955327"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005004302","display_name":"Haobin Chen","orcid":"https://orcid.org/0000-0003-3111-9824"},"institutions":[{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haobin Chen","raw_affiliation_strings":["Shenzhen Institutes of Advanced Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institutes of Advanced Technology, Shenzhen, China","institution_ids":["https://openalex.org/I4210145761"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083453098","display_name":"Lin Wu","orcid":"https://orcid.org/0000-0001-6119-058X"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Wu","raw_affiliation_strings":["Hefei University of Technology, Heifei, China"],"affiliations":[{"raw_affiliation_string":"Hefei University of Technology, Heifei, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005393674","display_name":"Jing Qin","orcid":"https://orcid.org/0000-0002-2961-0860"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jing Qin","raw_affiliation_strings":["The Hong Kong Polytechnic University, Kowloon, Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053073532","display_name":"Wei Peng","orcid":"https://orcid.org/0000-0002-9572-951X"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Peng","raw_affiliation_strings":["Huawei Technologies Ltd, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Huawei Technologies Ltd, Shenzhen, China","institution_ids":["https://openalex.org/I2250955327"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100723410"],"corresponding_institution_ids":["https://openalex.org/I2250955327"],"apc_list":null,"apc_paid":null,"fwci":2.2188,"has_fulltext":false,"cited_by_count":37,"citation_normalized_percentile":{"value":0.91793811,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"3291","last_page":"3300"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.738559901714325},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.7361609935760498},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6933656930923462},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6404764652252197},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5430076122283936},{"id":"https://openalex.org/keywords/generality","display_name":"Generality","score":0.49879884719848633},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4916549324989319},{"id":"https://openalex.org/keywords/dual","display_name":"Dual (grammatical number)","score":0.4464591443538666},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.39963293075561523},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.35469627380371094},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3253549635410309}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.738559901714325},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.7361609935760498},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6933656930923462},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6404764652252197},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5430076122283936},{"id":"https://openalex.org/C2780767217","wikidata":"https://www.wikidata.org/wiki/Q5532421","display_name":"Generality","level":2,"score":0.49879884719848633},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4916549324989319},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.4464591443538666},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.39963293075561523},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35469627380371094},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3253549635410309},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3503161.3548195","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3503161.3548195","pdf_url":null,"source":{"id":"https://openalex.org/S4363608757","display_name":"Proceedings of the 30th ACM International Conference on Multimedia","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.41999998688697815}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W2022322548","https://openalex.org/W2155803963","https://openalex.org/W2187089797","https://openalex.org/W2266728343","https://openalex.org/W2596603442","https://openalex.org/W2743104969","https://openalex.org/W2765440071","https://openalex.org/W2777534232","https://openalex.org/W2808260522","https://openalex.org/W2911286998","https://openalex.org/W2911840101","https://openalex.org/W2954773727","https://openalex.org/W2963187862","https://openalex.org/W2963597983","https://openalex.org/W2963844113","https://openalex.org/W2965857891","https://openalex.org/W2967957126","https://openalex.org/W2970390221","https://openalex.org/W2985033611","https://openalex.org/W2987222078","https://openalex.org/W2997877744","https://openalex.org/W3012871709","https://openalex.org/W3033235266","https://openalex.org/W3034519219","https://openalex.org/W3035241963","https://openalex.org/W3035673257","https://openalex.org/W3198378779","https://openalex.org/W3202750592","https://openalex.org/W3202788649","https://openalex.org/W3204075450","https://openalex.org/W3206241967"],"related_works":["https://openalex.org/W2045049461","https://openalex.org/W1978893398","https://openalex.org/W2201908702","https://openalex.org/W4381094582","https://openalex.org/W2369625323","https://openalex.org/W2364579609","https://openalex.org/W1977906818","https://openalex.org/W1522139108","https://openalex.org/W2353528968","https://openalex.org/W627697492"],"abstract_inverted_index":{"Conventional":[0],"methods":[1],"address":[2],"the":[3,9,23,54,58,71,76,86,105,110,125,130],"cross-modal":[4,43,111],"retrieval":[5,29,122],"problem":[6],"by":[7,103],"projecting":[8],"multi-modal":[10],"data":[11],"into":[12],"a":[13,18,63],"shared":[14],"representation":[15],"space.":[16],"Such":[17],"strategy":[19],"will":[20,50],"inevitably":[21],"lose":[22],"modality-specific":[24],"information,":[25],"leading":[26],"to":[27,39,69,109],"decreased":[28],"accuracy.":[30],"In":[31,61],"this":[32],"paper,":[33],"we":[34],"propose":[35],"heterogeneous":[36,77,98],"graph":[37,99],"embeddings":[38,56],"preserve":[40],"more":[41,79],"abundant":[42],"information.":[44,95],"The":[45,82,96],"embedding":[46,100],"from":[47,57],"one":[48],"modality":[49],"be":[51],"compensated":[52],"with":[53],"aggregated":[55,106],"other":[59],"modality.":[60],"particular,":[62],"self-denoising":[64],"tree":[65],"search":[66],"is":[67,101],"designed":[68],"reduce":[70],"\"label":[72],"noise\"":[73],"problem,":[74,89],"making":[75],"neighborhood":[78],"semantically":[80],"relevant.":[81],"dual-path":[83],"aggregation":[84],"tackles":[85],"\"modality":[87],"imbalance\"":[88],"giving":[90],"each":[91],"sample":[92],"comprehensive":[93],"dual-modality":[94,107],"final":[97],"obtained":[102],"feeding":[104],"features":[108],"self-attention":[112],"module.":[113],"Experiments":[114],"conducted":[115],"on":[116],"cross-modality":[117],"person":[118],"re-identification":[119],"and":[120,127],"image-text":[121],"task":[123],"validate":[124],"superiority":[126],"generality":[128],"of":[129],"proposed":[131],"method.":[132]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":15},{"year":2022,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
