{"id":"https://openalex.org/W4200632612","doi":"https://doi.org/10.1109/tnnls.2021.3135420","title":"Multimodal Mutual Information Maximization: A Novel Approach for Unsupervised Deep Cross-Modal Hashing","display_name":"Multimodal Mutual Information Maximization: A Novel Approach for Unsupervised Deep Cross-Modal Hashing","publication_year":2022,"publication_date":"2022-01-04","ids":{"openalex":"https://openalex.org/W4200632612","doi":"https://doi.org/10.1109/tnnls.2021.3135420","pmid":"https://pubmed.ncbi.nlm.nih.gov/34982698"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2021.3135420","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2021.3135420","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080253938","display_name":"Tuan Hoang","orcid":"https://orcid.org/0000-0002-1076-8043"},"institutions":[{"id":"https://openalex.org/I152815399","display_name":"Singapore University of Technology and Design","ror":"https://ror.org/05j6fvn87","country_code":"SG","type":"education","lineage":["https://openalex.org/I152815399"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Tuan Hoang","raw_affiliation_strings":["Information System Technology and Design (ISTD), Singapore University of Technology and Design (SUTD), Singapore"],"affiliations":[{"raw_affiliation_string":"Information System Technology and Design (ISTD), Singapore University of Technology and Design (SUTD), Singapore","institution_ids":["https://openalex.org/I152815399"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025723803","display_name":"Thanh-Toan Do","orcid":"https://orcid.org/0000-0002-6249-0848"},"institutions":[{"id":"https://openalex.org/I56590836","display_name":"Monash University","ror":"https://ror.org/02bfwt286","country_code":"AU","type":"education","lineage":["https://openalex.org/I56590836"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Thanh-Toan Do","raw_affiliation_strings":["Department of Data Science and AI, Faculty of Information Technology, Monash University, Clayton, VIC, Australia"],"affiliations":[{"raw_affiliation_string":"Department of Data Science and AI, Faculty of Information Technology, Monash University, Clayton, VIC, Australia","institution_ids":["https://openalex.org/I56590836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022799473","display_name":"Tam Nguyen","orcid":"https://orcid.org/0000-0003-0236-7992"},"institutions":[{"id":"https://openalex.org/I127591826","display_name":"University of Dayton","ror":"https://ror.org/021v3qy27","country_code":"US","type":"education","lineage":["https://openalex.org/I127591826"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tam V. Nguyen","raw_affiliation_strings":["Department of Computer Science, University of Dayton, Dayton, OH, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Dayton, Dayton, OH, USA","institution_ids":["https://openalex.org/I127591826"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057453537","display_name":"Ngai\u2010Man Cheung","orcid":"https://orcid.org/0000-0003-0135-3791"},"institutions":[{"id":"https://openalex.org/I152815399","display_name":"Singapore University of Technology and Design","ror":"https://ror.org/05j6fvn87","country_code":"SG","type":"education","lineage":["https://openalex.org/I152815399"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Ngai-Man Cheung","raw_affiliation_strings":["Information System Technology and Design (ISTD), Singapore University of Technology and Design (SUTD), Singapore"],"affiliations":[{"raw_affiliation_string":"Information System Technology and Design (ISTD), Singapore University of Technology and Design (SUTD), Singapore","institution_ids":["https://openalex.org/I152815399"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5080253938"],"corresponding_institution_ids":["https://openalex.org/I152815399"],"apc_list":null,"apc_paid":null,"fwci":4.131,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.9522718,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"34","issue":"9","first_page":"6289","last_page":"6302"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6891757249832153},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.6366580128669739},{"id":"https://openalex.org/keywords/mutual-information","display_name":"Mutual information","score":0.6343854069709778},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.5976188778877258},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5301740169525146},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5100653767585754},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.48173239827156067},{"id":"https://openalex.org/keywords/binary-code","display_name":"Binary code","score":0.4756224453449249},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.4718867540359497},{"id":"https://openalex.org/keywords/maximization","display_name":"Maximization","score":0.4532037079334259},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.45025479793548584},{"id":"https://openalex.org/keywords/universal-hashing","display_name":"Universal hashing","score":0.4285750687122345},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3901676535606384},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3684789538383484},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3589433431625366},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1652105450630188},{"id":"https://openalex.org/keywords/double-hashing","display_name":"Double hashing","score":0.14914646744728088},{"id":"https://openalex.org/keywords/hash-table","display_name":"Hash table","score":0.14183929562568665},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.1230154037475586},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.11529448628425598}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6891757249832153},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.6366580128669739},{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.6343854069709778},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.5976188778877258},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5301740169525146},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5100653767585754},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.48173239827156067},{"id":"https://openalex.org/C63435697","wikidata":"https://www.wikidata.org/wiki/Q864135","display_name":"Binary code","level":3,"score":0.4756224453449249},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.4718867540359497},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.4532037079334259},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.45025479793548584},{"id":"https://openalex.org/C116058348","wikidata":"https://www.wikidata.org/wiki/Q846912","display_name":"Universal hashing","level":5,"score":0.4285750687122345},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3901676535606384},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3684789538383484},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3589433431625366},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1652105450630188},{"id":"https://openalex.org/C138111711","wikidata":"https://www.wikidata.org/wiki/Q478351","display_name":"Double hashing","level":4,"score":0.14914646744728088},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.14183929562568665},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.1230154037475586},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.11529448628425598},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2021.3135420","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2021.3135420","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:34982698","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/34982698","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G405023977","display_name":null,"funder_award_id":"AISG-100E2018-005","funder_id":"https://openalex.org/F4320320709","funder_display_name":"National Research Foundation Singapore"},{"id":"https://openalex.org/G6231721661","display_name":null,"funder_award_id":"PIE-SGP-AI-2018-01","funder_id":"https://openalex.org/F4320324110","funder_display_name":"Singapore University of Technology and Design"}],"funders":[{"id":"https://openalex.org/F4320320709","display_name":"National Research Foundation Singapore","ror":"https://ror.org/03cpyc314"},{"id":"https://openalex.org/F4320324110","display_name":"Singapore University of Technology and Design","ror":"https://ror.org/05j6fvn87"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":88,"referenced_works":["https://openalex.org/W1489116628","https://openalex.org/W1861492603","https://openalex.org/W1922199343","https://openalex.org/W1964073652","https://openalex.org/W1974647172","https://openalex.org/W2007972815","https://openalex.org/W2044195942","https://openalex.org/W2049993534","https://openalex.org/W2086958058","https://openalex.org/W2095439994","https://openalex.org/W2155803963","https://openalex.org/W2159373756","https://openalex.org/W2166944917","https://openalex.org/W2199369932","https://openalex.org/W2203543769","https://openalex.org/W2251084241","https://openalex.org/W2266728343","https://openalex.org/W2345649690","https://openalex.org/W2345891614","https://openalex.org/W2388114291","https://openalex.org/W2476034201","https://openalex.org/W2482105843","https://openalex.org/W2510661833","https://openalex.org/W2512032049","https://openalex.org/W2591669147","https://openalex.org/W2602646780","https://openalex.org/W2604880013","https://openalex.org/W2613332842","https://openalex.org/W2733636222","https://openalex.org/W2748725735","https://openalex.org/W2759194679","https://openalex.org/W2765440071","https://openalex.org/W2788843501","https://openalex.org/W2795832645","https://openalex.org/W2799150641","https://openalex.org/W2808243243","https://openalex.org/W2842511635","https://openalex.org/W2889024947","https://openalex.org/W2891193211","https://openalex.org/W2894874917","https://openalex.org/W2894879246","https://openalex.org/W2898403805","https://openalex.org/W2901281242","https://openalex.org/W2905040928","https://openalex.org/W2907166662","https://openalex.org/W2941765879","https://openalex.org/W2953037339","https://openalex.org/W2962793481","https://openalex.org/W2962804981","https://openalex.org/W2962955826","https://openalex.org/W2963187862","https://openalex.org/W2963288100","https://openalex.org/W2963340196","https://openalex.org/W2963916624","https://openalex.org/W2967862025","https://openalex.org/W2976061040","https://openalex.org/W2982223282","https://openalex.org/W2982905682","https://openalex.org/W2985346367","https://openalex.org/W2999606372","https://openalex.org/W3011997138","https://openalex.org/W3034890701","https://openalex.org/W3049577264","https://openalex.org/W3081175302","https://openalex.org/W3108655343","https://openalex.org/W3176403475","https://openalex.org/W4243316134","https://openalex.org/W6604628494","https://openalex.org/W6608183366","https://openalex.org/W6637108112","https://openalex.org/W6684115544","https://openalex.org/W6684191040","https://openalex.org/W6685282478","https://openalex.org/W6693399182","https://openalex.org/W6697214482","https://openalex.org/W6717434760","https://openalex.org/W6718140377","https://openalex.org/W6721087566","https://openalex.org/W6729906282","https://openalex.org/W6730091202","https://openalex.org/W6735799286","https://openalex.org/W6748223763","https://openalex.org/W6752051073","https://openalex.org/W6754278344","https://openalex.org/W6755207826","https://openalex.org/W6762796984","https://openalex.org/W6762915377","https://openalex.org/W6771610787"],"related_works":["https://openalex.org/W2132034299","https://openalex.org/W3124800526","https://openalex.org/W4251536634","https://openalex.org/W1551533237","https://openalex.org/W2185281229","https://openalex.org/W1750955152","https://openalex.org/W43986179","https://openalex.org/W4319653630","https://openalex.org/W3192973254","https://openalex.org/W2088296667"],"abstract_inverted_index":{"In":[0],"this":[1],"article,":[2],"we":[3,49,97,119],"adopt":[4],"the":[5,13,51,63,66,85,88,126,135,151,161,173],"maximizing":[6,62,81],"mutual":[7],"information":[8,157],"(MI)":[9],"approach":[10],"to":[11,37,61,124],"tackle":[12],"problem":[14],"of":[15,18,59,76],"unsupervised":[16],"learning":[17,130],"binary":[19,67,74,89,100,132],"hash":[20],"codes":[21],"for":[22,134,160],"efficient":[23],"cross-modal":[24,32,162,180],"retrieval.":[25],"We":[26],"proposed":[27,174],"a":[28,112],"novel":[29],"method,":[30],"dubbed":[31],"info-max":[33],"hashing":[34],"(CMIMH).":[35],"First,":[36],"learn":[38,99],"informative":[39,145],"representations":[40,68,75,90,133],"that":[41,87,122,172],"can":[42,98,103],"preserve":[43,104],"both":[44,105],"intramodal":[45,106],"and":[46,69,72,107,154],"intermodal":[47,108],"similarities,":[48,109],"leverage":[50],"recent":[52],"advances":[53],"in":[54,111,143],"estimating":[55],"variational":[56],"lower":[57],"bound":[58],"MI":[60,64],"between":[65,73,149],"input":[70],"features":[71],"different":[77,139],"modalities.":[78],"By":[79],"jointly":[80],"these":[82],"MIs":[83],"under":[84],"assumption":[86],"are":[91],"modeled":[92],"by":[93,129],"multivariate":[94],"Bernoulli":[95],"distributions,":[96],"representations,":[101],"which":[102],"effectively":[110],"mini-batch":[113],"manner":[114],"with":[115],"gradient":[116],"descent.":[117],"Furthermore,":[118],"find":[120],"out":[121],"trying":[123],"minimize":[125],"modality":[127,152],"gap":[128,153],"similar":[131],"same":[136],"instance":[137],"from":[138],"modalities":[140],"could":[141],"result":[142],"less":[144],"representations.":[146],"Hence,":[147],"balancing":[148],"reducing":[150],"losing":[155],"modality-private":[156],"is":[158],"important":[159],"retrieval":[163,181],"tasks.":[164],"Quantitative":[165],"evaluations":[166],"on":[167],"standard":[168],"benchmark":[169],"datasets":[170],"demonstrate":[171],"method":[175],"consistently":[176],"outperforms":[177],"other":[178],"state-of-the-art":[179],"methods.":[182]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":15},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
