{"id":"https://openalex.org/W7125937060","doi":"https://doi.org/10.1109/smc58881.2025.11343568","title":"Deep Multi-Feature Hash Networks for Image-Text Retrieval","display_name":"Deep Multi-Feature Hash Networks for Image-Text Retrieval","publication_year":2025,"publication_date":"2025-10-05","ids":{"openalex":"https://openalex.org/W7125937060","doi":"https://doi.org/10.1109/smc58881.2025.11343568"},"language":null,"primary_location":{"id":"doi:10.1109/smc58881.2025.11343568","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11343568","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124082957","display_name":"Zheng Dong","orcid":null},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]},{"id":"https://openalex.org/I4210142748","display_name":"Shandong Academy of Sciences","ror":"https://ror.org/04y8d6y55","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zheng Dong","raw_affiliation_strings":["Qilu University of Technology (Shandong Academy of Sciences),Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center,Jinan,China"],"affiliations":[{"raw_affiliation_string":"Qilu University of Technology (Shandong Academy of Sciences),Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center,Jinan,China","institution_ids":["https://openalex.org/I152269853","https://openalex.org/I4210142748"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124122628","display_name":"Ruijia Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]},{"id":"https://openalex.org/I4210142748","display_name":"Shandong Academy of Sciences","ror":"https://ror.org/04y8d6y55","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruijia Zhang","raw_affiliation_strings":["Qilu University of Technology (Shandong Academy of Sciences),Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center,Jinan,China"],"affiliations":[{"raw_affiliation_string":"Qilu University of Technology (Shandong Academy of Sciences),Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center,Jinan,China","institution_ids":["https://openalex.org/I152269853","https://openalex.org/I4210142748"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112934807","display_name":"Qin Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]},{"id":"https://openalex.org/I4210142748","display_name":"Shandong Academy of Sciences","ror":"https://ror.org/04y8d6y55","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qin Lu","raw_affiliation_strings":["Qilu University of Technology (Shandong Academy of Sciences),Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center,Jinan,China"],"affiliations":[{"raw_affiliation_string":"Qilu University of Technology (Shandong Academy of Sciences),Key Laboratory of Computing Power Network and Information Security, Ministry of Education, Shandong Computer Science Center,Jinan,China","institution_ids":["https://openalex.org/I152269853","https://openalex.org/I4210142748"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5124082957"],"corresponding_institution_ids":["https://openalex.org/I152269853","https://openalex.org/I4210142748"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.7158954,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"7645","last_page":"7650"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9362000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9362000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.014000000432133675,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.004100000020116568,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.7182000279426575},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.5569999814033508},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5170999765396118},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5131000280380249},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4846999943256378},{"id":"https://openalex.org/keywords/semantic-feature","display_name":"Semantic feature","score":0.44589999318122864},{"id":"https://openalex.org/keywords/feature-hashing","display_name":"Feature hashing","score":0.42320001125335693},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.39719998836517334}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8151999711990356},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.7182000279426575},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.5569999814033508},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5200999975204468},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5170999765396118},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5131000280380249},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4846999943256378},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.44589999318122864},{"id":"https://openalex.org/C133667856","wikidata":"https://www.wikidata.org/wiki/Q5439682","display_name":"Feature hashing","level":5,"score":0.42320001125335693},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.39719998836517334},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.37130001187324524},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35670000314712524},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.353300005197525},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.3508000075817108},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3158000111579895},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3109999895095825},{"id":"https://openalex.org/C63435697","wikidata":"https://www.wikidata.org/wiki/Q864135","display_name":"Binary code","level":3,"score":0.2896000146865845},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.2838999927043915},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2784000039100647},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.2696000039577484},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.26919999718666077},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2583000063896179}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/smc58881.2025.11343568","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11343568","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W2007972815","https://openalex.org/W2155803963","https://openalex.org/W2266728343","https://openalex.org/W2277195237","https://openalex.org/W2346746376","https://openalex.org/W2531409750","https://openalex.org/W2788843501","https://openalex.org/W2802864907","https://openalex.org/W2963988212","https://openalex.org/W2982905682","https://openalex.org/W2999606372","https://openalex.org/W3012050760","https://openalex.org/W3033799362","https://openalex.org/W3035747010","https://openalex.org/W3098766884","https://openalex.org/W3100847621","https://openalex.org/W3175740157","https://openalex.org/W3209532803","https://openalex.org/W4210882633","https://openalex.org/W4304092731","https://openalex.org/W4383503840"],"related_works":[],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"cross-modal":[3,39,84,191,229],"image-text":[4,249],"retrieval":[5,50,61,85,224],"has":[6,29],"gained":[7],"significant":[8],"attention":[9],"due":[10],"to":[11,14,47,78,119,137,151],"its":[12],"ability":[13],"efficiently":[15],"retrieve":[16],"semantically":[17],"relevant":[18],"information":[19,142],"from":[20],"large-scale":[21],"multimedia":[22],"data.":[23],"The":[24,91,108],"rise":[25],"of":[26,93,143],"deep":[27,72],"learning":[28],"provided":[30],"new":[31],"perspectives":[32],"for":[33],"addressing":[34],"the":[35,97,100,131,139,171,185],"heterogeneity":[36],"challenge":[37],"in":[38,96,128,248],"retrieval.":[40],"However,":[41],"existing":[42,253],"hashing":[43,74,210],"methods":[44],"often":[45],"struggle":[46],"balance":[48],"efficient":[49,81],"with":[51,115,160],"fine-grained":[52,83,204],"semantic":[53,57,205,230],"alignment":[54],"and":[55,82,104,125,181,199,214,237],"global":[56,123,140,158],"understanding,":[58],"thereby":[59],"limiting":[60],"accuracy.":[62],"To":[63],"tackle":[64],"these":[65],"challenges,":[66],"this":[67],"paper":[68],"proposes":[69],"a":[70,105,165,190,208],"novel":[71],"multi-feature":[73],"network":[75],"(DMFHN),":[76],"designed":[77],"achieve":[79],"both":[80,122],"through":[86],"compact":[87,219],"binary":[88],"hash":[89,220],"codes.":[90],"core":[92],"DMFHN":[94,212,244],"lies":[95],"synergy":[98],"between":[99],"feature":[101,109,192],"optimization":[102,110],"encoder":[103,111],"bidirectional":[106,172],"GRU.":[107],"integrates":[112,197],"self-attention":[113,136],"mechanisms":[114],"depthwise":[116,148],"separable":[117,149],"convolutions":[118,150],"effectively":[120],"capture":[121],"dependencies":[124,180],"local":[126,154,161],"details":[127],"images.":[129],"Specifically,":[130],"module":[132],"first":[133],"employs":[134],"multi-head":[135],"model":[138],"contextual":[141,182],"an":[144],"image,":[145],"then":[146],"utilizes":[147],"extract":[152],"crucial":[153],"features.":[155],"By":[156],"fusing":[157],"relationships":[159],"details,":[162],"it":[163],"generates":[164],"more":[166],"expressive":[167],"image":[168,198],"representation.":[169],"Meanwhile,":[170],"GRU":[173],"enhances":[174],"textual":[175],"features":[176,217],"by":[177],"capturing":[178],"sequential":[179],"semantics":[183],"within":[184],"text.":[186],"Additionally,":[187],"we":[188],"design":[189],"fusion":[193],"strategy":[194],"that":[195,243],"dynamically":[196],"text":[200],"representations,":[201],"further":[202],"improving":[203],"expressiveness.":[206],"Through":[207],"well-optimized":[209],"function,":[211],"constrains":[213],"quantizes":[215],"multi-modal":[216],"into":[218],"codes,":[221],"ensuring":[222],"high":[223],"efficiency":[225],"while":[226],"maintaining":[227],"strong":[228],"consistency.":[231],"Finally,":[232],"experiments":[233],"conducted":[234],"on":[235],"MIRFLICKR-25K":[236],"NUS-WIDE,":[238],"two":[239],"real-world":[240],"datasets,":[241],"demonstrate":[242],"achieves":[245],"state-of-the-art":[246],"performance":[247],"retrieval,":[250],"significantly":[251],"outperforming":[252],"mainstream":[254],"methods.":[255]},"counts_by_year":[],"updated_date":"2026-01-29T23:17:01.242718","created_date":"2026-01-29T00:00:00"}
