{"id":"https://openalex.org/W3170032237","doi":"https://doi.org/10.1109/icme51207.2021.9428240","title":"Learning Homogeneous and Heterogeneous Co-Occurrences for Unsupervised Cross-Modal Retrieval","display_name":"Learning Homogeneous and Heterogeneous Co-Occurrences for Unsupervised Cross-Modal Retrieval","publication_year":2021,"publication_date":"2021-06-09","ids":{"openalex":"https://openalex.org/W3170032237","doi":"https://doi.org/10.1109/icme51207.2021.9428240","mag":"3170032237"},"language":"en","primary_location":{"id":"doi:10.1109/icme51207.2021.9428240","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme51207.2021.9428240","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026250307","display_name":"Yang Zhao","orcid":"https://orcid.org/0000-0001-7809-6514"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yang Zhao","raw_affiliation_strings":["Nanjing University of Science and Technology,School of Computer Science and Engineering,China","School of Computer Science and Engineering, Nanjing University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Science and Technology,School of Computer Science and Engineering,China","institution_ids":["https://openalex.org/I36399199"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100734850","display_name":"Weiwei Wang","orcid":"https://orcid.org/0000-0002-6985-2784"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weiwei Wang","raw_affiliation_strings":["Nanjing University of Science and Technology,School of Computer Science and Engineering,China","School of Computer Science and Engineering, Nanjing University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Science and Technology,School of Computer Science and Engineering,China","institution_ids":["https://openalex.org/I36399199"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064008061","display_name":"Haofeng Zhang","orcid":"https://orcid.org/0000-0002-4039-7618"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haofeng Zhang","raw_affiliation_strings":["Nanjing University of Science and Technology,School of Computer Science and Engineering,China","School of Computer Science and Engineering, Nanjing University of Science and Technology, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Science and Technology,School of Computer Science and Engineering,China","institution_ids":["https://openalex.org/I36399199"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Nanjing University of Science and Technology, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031969180","display_name":"Bingzhang Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210118681","display_name":"Industry Vision Automation (United States)","ror":"https://ror.org/02pt5ea98","country_code":"US","type":"company","lineage":["https://openalex.org/I4210118681"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bingzhang Hu","raw_affiliation_strings":["Hefei CAS Dihuge Automation Co., LTD.,Vision Intelligence Center","Vision Intelligence Center, Hefei CAS Dihuge Automation Co., LTD"],"affiliations":[{"raw_affiliation_string":"Hefei CAS Dihuge Automation Co., LTD.,Vision Intelligence Center","institution_ids":["https://openalex.org/I4210118681"]},{"raw_affiliation_string":"Vision Intelligence Center, Hefei CAS Dihuge Automation Co., LTD","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5026250307"],"corresponding_institution_ids":["https://openalex.org/I36399199"],"apc_list":null,"apc_paid":null,"fwci":0.5764,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.67712418,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7675172090530396},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.7226374745368958},{"id":"https://openalex.org/keywords/homogeneous","display_name":"Homogeneous","score":0.7041964530944824},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6375657916069031},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5580111145973206},{"id":"https://openalex.org/keywords/aggregate","display_name":"Aggregate (composite)","score":0.52984619140625},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5004317760467529},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.48379725217819214},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4625418186187744},{"id":"https://openalex.org/keywords/semantic-matching","display_name":"Semantic matching","score":0.42904454469680786},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.356706827878952},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11118310689926147}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7675172090530396},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.7226374745368958},{"id":"https://openalex.org/C66882249","wikidata":"https://www.wikidata.org/wiki/Q169336","display_name":"Homogeneous","level":2,"score":0.7041964530944824},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6375657916069031},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5580111145973206},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.52984619140625},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5004317760467529},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.48379725217819214},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4625418186187744},{"id":"https://openalex.org/C2778493491","wikidata":"https://www.wikidata.org/wiki/Q7449072","display_name":"Semantic matching","level":3,"score":0.42904454469680786},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.356706827878952},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11118310689926147},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme51207.2021.9428240","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme51207.2021.9428240","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6800000071525574}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322769","display_name":"Natural Science Foundation of Jiangsu Province","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1861492603","https://openalex.org/W1905882502","https://openalex.org/W2063046703","https://openalex.org/W2185175083","https://openalex.org/W2194775991","https://openalex.org/W2277195237","https://openalex.org/W2346425926","https://openalex.org/W2546696630","https://openalex.org/W2745461083","https://openalex.org/W2774267535","https://openalex.org/W2883311563","https://openalex.org/W2911286998","https://openalex.org/W2962964995","https://openalex.org/W2963040148","https://openalex.org/W2963467339","https://openalex.org/W2963743213","https://openalex.org/W2963919031","https://openalex.org/W2964120214","https://openalex.org/W2973978812","https://openalex.org/W3034336960","https://openalex.org/W4297733535","https://openalex.org/W4385245566","https://openalex.org/W6620707391","https://openalex.org/W6639102338","https://openalex.org/W6693820011","https://openalex.org/W6739901393","https://openalex.org/W6747225742","https://openalex.org/W6767617715"],"related_works":["https://openalex.org/W2385859805","https://openalex.org/W2530972254","https://openalex.org/W2374013449","https://openalex.org/W73545470","https://openalex.org/W2364381299","https://openalex.org/W2374430585","https://openalex.org/W1598955744","https://openalex.org/W3144423903","https://openalex.org/W2377397762","https://openalex.org/W627697492"],"abstract_inverted_index":{"Image-text":[0],"retrieval,":[1],"which":[2,100],"focuses":[3],"on":[4,167,179],"unifying":[5],"both":[6,154],"visual":[7],"and":[8,48,65,92,128,157,182],"textual":[9],"representations,":[10],"is":[11],"one":[12,69],"of":[13,17,30,53,58,81,103,113,126,188],"the":[14,33,40,44,56,60,72,77,138,145,150,161,185,193],"major":[15],"tasks":[16],"cross-modal":[18],"information":[19,79],"processing.":[20],"With":[21],"attention":[22],"mechanism,":[23],"previous":[24],"methods":[25],"performing":[26],"well":[27],"take":[28],"advantage":[29],"not":[31],"only":[32],"correspondence":[34],"in":[35,46,68,110],"image-text":[36,168],"level":[37],"but":[38],"also":[39],"semantic":[41,61,66,174],"alignment":[42],"between":[43,63],"regions":[45,127],"images":[47],"corresponding":[49],"words.":[50],"However,":[51],"few":[52],"them":[54],"comprehend":[55],"importance":[57],"combing":[59],"relationship":[62],"multimodalities":[64],"correspondences":[67,120],"modality":[70,156,159],"at":[71,160],"same":[73,162],"time.":[74],"Inspired":[75],"by":[76],"heterogeneous":[78,82],"learning":[80],"graph":[83],"network,":[84],"we":[85],"propose":[86],"a":[87,111],"novel":[88],"method":[89,147],"called":[90],"Homogeneous":[91,116],"Heterogeneous":[93,132],"Co-Occurrences":[94],"(H":[95],"<inf":[96],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[97],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">2</inf>":[98],"CO)":[99],"mainly":[101],"consists":[102],"two":[104],"modules":[105],"to":[106,136],"achieve":[107],"modal":[108,125,191],"co-occurrence":[109],"query":[112],"corporations.":[114],"Specifically,":[115],"Co-Occurrence":[117,133],"Module":[118,134],"captures":[119],"with":[121],"neighbors":[122,141],"from":[123,153],"single":[124],"words":[129],"respectively,":[130],"while":[131],"aims":[135],"learn":[137],"relations":[139],"about":[140],"across":[142],"modalities.":[143],"Finally,":[144],"proposed":[146,190],"can":[148],"aggregate":[149],"neighborhood":[151],"features":[152],"intra":[155],"inter":[158],"time,":[163],"thus":[164],"performs":[165],"better":[166],"matching":[169],"for":[170],"considering":[171],"much":[172],"more":[173],"information.":[175],"Extensive":[176],"experimental":[177],"results":[178],"MS":[180],"COCO":[181],"Flickr30K":[183],"show":[184],"superior":[186],"performance":[187],"our":[189],"over":[192],"state-of-the-arts.":[194]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
