{"id":"https://openalex.org/W4416011359","doi":"https://doi.org/10.1109/tpami.2025.3630209","title":"Dynamic Bit-Wise Semantic Transformer Hashing for Multi-Modal Retrieval","display_name":"Dynamic Bit-Wise Semantic Transformer Hashing for Multi-Modal Retrieval","publication_year":2025,"publication_date":"2025-11-07","ids":{"openalex":"https://openalex.org/W4416011359","doi":"https://doi.org/10.1109/tpami.2025.3630209","pmid":"https://pubmed.ncbi.nlm.nih.gov/41201942"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3630209","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3630209","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060463460","display_name":"Wentao Tan","orcid":"https://orcid.org/0000-0001-5907-1581"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wentao Tan","raw_affiliation_strings":["School of Computer Science and Technology, Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Fengling Li","orcid":"https://orcid.org/0000-0002-3432-6215"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Fengling Li","raw_affiliation_strings":["Australian Artificial Intelligence Institute, Faculty of Engineering and Information Technology, University of Technology Sydney, Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"Australian Artificial Intelligence Institute, Faculty of Engineering and Information Technology, University of Technology Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I114017466"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Lei Zhu","orcid":"https://orcid.org/0000-0002-2993-7142"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Zhu","raw_affiliation_strings":["School of Computer Science and Technology, Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075938343","display_name":"Weili Guan","orcid":"https://orcid.org/0000-0002-5658-5509"},"institutions":[{"id":"https://openalex.org/I56590836","display_name":"Monash University","ror":"https://ror.org/02bfwt286","country_code":"AU","type":"education","lineage":["https://openalex.org/I56590836"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Weili Guan","raw_affiliation_strings":["Monash University, Clayton, VIC, Australia"],"affiliations":[{"raw_affiliation_string":"Monash University, Clayton, VIC, Australia","institution_ids":["https://openalex.org/I56590836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100338386","display_name":"Jingjing Li","orcid":"https://orcid.org/0000-0002-5504-2529"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingjing Li","raw_affiliation_strings":["School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068843001","display_name":"Zhiyong Cheng","orcid":"https://orcid.org/0000-0003-1109-5028"},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]},{"id":"https://openalex.org/I4210142748","display_name":"Shandong Academy of Sciences","ror":"https://ror.org/04y8d6y55","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Cheng","raw_affiliation_strings":["Shandong Artificial Intelligence Institute, Qilu University of Technology (Shandong Academy of Sciences), Jinan, China","Shandong Artificial Intelligence Institute, Qilu University of Technology (Shandong Academy of Sciences), Jinan, Shandong, China"],"affiliations":[{"raw_affiliation_string":"Shandong Artificial Intelligence Institute, Qilu University of Technology (Shandong Academy of Sciences), Jinan, China","institution_ids":["https://openalex.org/I4210142748","https://openalex.org/I152269853"]},{"raw_affiliation_string":"Shandong Artificial Intelligence Institute, Qilu University of Technology (Shandong Academy of Sciences), Jinan, Shandong, China","institution_ids":["https://openalex.org/I4210142748","https://openalex.org/I152269853"]}]},{"author_position":"last","author":{"id":null,"display_name":"Heng Tao Shen","orcid":"https://orcid.org/0000-0002-2999-2088"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Heng Tao Shen","raw_affiliation_strings":["School of Computer Science and Technology, Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5060463460"],"corresponding_institution_ids":["https://openalex.org/I116953780"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.3274596,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"48","issue":"3","first_page":"2954","last_page":"2969"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9336000084877014,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9336000084877014,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.006300000008195639,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.003700000001117587,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.7976999878883362},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.57669997215271},{"id":"https://openalex.org/keywords/dynamic-perfect-hashing","display_name":"Dynamic perfect hashing","score":0.4578999876976013},{"id":"https://openalex.org/keywords/double-hashing","display_name":"Double hashing","score":0.451200008392334},{"id":"https://openalex.org/keywords/binary-code","display_name":"Binary code","score":0.4447999894618988},{"id":"https://openalex.org/keywords/universal-hashing","display_name":"Universal hashing","score":0.42489999532699585},{"id":"https://openalex.org/keywords/semantic-gap","display_name":"Semantic gap","score":0.4187000095844269},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.3944000005722046}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8109999895095825},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.7976999878883362},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.57669997215271},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49399998784065247},{"id":"https://openalex.org/C122907437","wikidata":"https://www.wikidata.org/wiki/Q5318999","display_name":"Dynamic perfect hashing","level":5,"score":0.4578999876976013},{"id":"https://openalex.org/C138111711","wikidata":"https://www.wikidata.org/wiki/Q478351","display_name":"Double hashing","level":4,"score":0.451200008392334},{"id":"https://openalex.org/C63435697","wikidata":"https://www.wikidata.org/wiki/Q864135","display_name":"Binary code","level":3,"score":0.4447999894618988},{"id":"https://openalex.org/C116058348","wikidata":"https://www.wikidata.org/wiki/Q846912","display_name":"Universal hashing","level":5,"score":0.42489999532699585},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.4187000095844269},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3944000005722046},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.3921000063419342},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.38999998569488525},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.37779998779296875},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3767000138759613},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.37560001015663147},{"id":"https://openalex.org/C133667856","wikidata":"https://www.wikidata.org/wiki/Q5439682","display_name":"Feature hashing","level":5,"score":0.3587999939918518},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3231000006198883},{"id":"https://openalex.org/C77660490","wikidata":"https://www.wikidata.org/wiki/Q244916","display_name":"Intermediate language","level":3,"score":0.30090001225471497},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2962999939918518},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.29100000858306885},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.29089999198913574},{"id":"https://openalex.org/C2778180026","wikidata":"https://www.wikidata.org/wiki/Q18378163","display_name":"Semantic heterogeneity","level":4,"score":0.2865999937057495},{"id":"https://openalex.org/C36375716","wikidata":"https://www.wikidata.org/wiki/Q6553456","display_name":"Linear hashing","level":5,"score":0.28029999136924744},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.26409998536109924},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.25940001010894775},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.2551000118255615}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2025.3630209","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3630209","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:41201942","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41201942","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":60,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2007972815","https://openalex.org/W2015175493","https://openalex.org/W2025432722","https://openalex.org/W2039208785","https://openalex.org/W2053186076","https://openalex.org/W2086958058","https://openalex.org/W2087193308","https://openalex.org/W2093932377","https://openalex.org/W2167451801","https://openalex.org/W2170942078","https://openalex.org/W2266728343","https://openalex.org/W2411707397","https://openalex.org/W2493727926","https://openalex.org/W2620123979","https://openalex.org/W2747853580","https://openalex.org/W2765440071","https://openalex.org/W2781821509","https://openalex.org/W2802864907","https://openalex.org/W2805087257","https://openalex.org/W2896457183","https://openalex.org/W2904458925","https://openalex.org/W2940532918","https://openalex.org/W2955273087","https://openalex.org/W2963540428","https://openalex.org/W2967957126","https://openalex.org/W2981076146","https://openalex.org/W2982065678","https://openalex.org/W2994818707","https://openalex.org/W3006683596","https://openalex.org/W3006871679","https://openalex.org/W3008014442","https://openalex.org/W3011911986","https://openalex.org/W3028385587","https://openalex.org/W3035747010","https://openalex.org/W3096609285","https://openalex.org/W3103671489","https://openalex.org/W3113055207","https://openalex.org/W3159460504","https://openalex.org/W3173956867","https://openalex.org/W3201835075","https://openalex.org/W3207267030","https://openalex.org/W4200200221","https://openalex.org/W4213019189","https://openalex.org/W4282937884","https://openalex.org/W4284687590","https://openalex.org/W4285242239","https://openalex.org/W4304092731","https://openalex.org/W4312477797","https://openalex.org/W4317496691","https://openalex.org/W4360884927","https://openalex.org/W4379382581","https://openalex.org/W4383900188","https://openalex.org/W4385245566","https://openalex.org/W4387969056","https://openalex.org/W4388189902","https://openalex.org/W4388191759","https://openalex.org/W4392172801","https://openalex.org/W4396712913","https://openalex.org/W4400033078"],"related_works":[],"abstract_inverted_index":{"Multi-modal":[0],"hashing":[1,243],"aims":[2],"to":[3,164,191,237],"succinctly":[4],"encode":[5],"heterogeneous":[6,43,124],"modalities":[7],"into":[8],"binary":[9,79],"hash":[10,68,72,113,194,234],"codes,":[11],"facilitating":[12,120,151,257],"efficient":[13],"multimedia":[14],"retrieval":[15,23,272,285],"characterized":[16],"by":[17,168],"low":[18],"storage":[19],"demands":[20],"and":[21,51,59,130,181,231,283],"high":[22],"speed.":[24],"Despite":[25],"the":[26,42,63,101,143,152,178,184,218,239,242,258,275],"commendable":[27],"achievements":[28],"of":[29,41,56,67,78,123,146,154,220,241,260,277],"existing":[30],"methods,":[31],"they":[32],"still":[33],"face":[34],"three":[35,268],"crucial":[36],"challenges:":[37],"1)":[38],"Inadequate":[39],"bridging":[40],"modality":[44],"gap":[45],"through":[46,217],"coarse,":[47],"global":[48],"feature-level":[49,71],"alignment":[50,122,180],"fusion.":[52],"2)":[53],"The":[54,76],"erosion":[55],"bit":[57,114,128],"independence":[58,129],"consequent":[60],"limitations":[61],"on":[62,183,267],"semantic":[64,82,89,118,156,229,262],"representation":[65,132],"capacity":[66],"codes":[69],"during":[70],"code":[73],"learning.":[74],"3)":[75],"insufficiency":[77],"label-based":[80],"pairwise":[81],"preservation":[83],"strategies":[84],"in":[85,245,280],"capturing":[86],"intricate":[87],"fine-grained":[88,185,227],"correlations":[90,171,230],"within":[91],"multi-modal":[92,148,179,248,271],"data.":[93],"To":[94,196],"address":[95],"these":[96,166],"challenges,":[97],"this":[98],"paper":[99],"introduces":[100],"Dynamic":[102],"Bit-wise":[103],"Semantic":[104],"Transformer":[105],"Hashing":[106],"(DBSTH)":[107],"framework.":[108],"Remarkably,":[109],"it":[110],"treats":[111],"each":[112,189],"as":[115],"a":[116,137,161,203,250],"unique":[117],"concept,":[119],"concept-level":[121],"modalities.":[125],"This":[126,223],"safeguards":[127],"augments":[131],"capabilities.":[133],"Specifically,":[134],"we":[135,159,176],"devise":[136],"dynamic":[138],"unit":[139],"fusion":[140,182],"strategy":[141,254],"for":[142,200,214],"adaptive":[144],"combination":[145],"local":[147],"information":[149],"units,":[150],"acquisition":[153,259],"bit-wise":[155],"concepts.":[157,174,263],"Subsequently,":[158],"incorporate":[160],"transformer":[162],"encoder":[163],"refine":[165],"concepts":[167],"uncovering":[169],"latent":[170],"among":[172],"distinct":[173],"Finally,":[175],"perform":[177],"concept-level,":[186],"independently":[187],"encoding":[188],"concept":[190,201,252],"its":[192],"corresponding":[193],"bit.":[195],"provide":[197],"enhanced":[198],"guidance":[199],"learning,":[202],"label":[204],"prototype":[205,212],"learning":[206,253],"mechanism":[207,224],"is":[208,255],"introduced,":[209,256],"which":[210],"learns":[211],"embeddings":[213],"all":[215],"categories":[216],"consideration":[219],"co-occurrence":[221],"priors.":[222],"effectively":[225],"captures":[226],"explicit":[228],"generates":[232],"supervising":[233],"codes.":[235],"Additionally,":[236],"improve":[238],"robustness":[240],"model":[244],"handling":[246],"noisy":[247],"data,":[249],"masked":[251],"resilient":[261],"Extensive":[264],"experiments":[265],"conducted":[266],"widely":[269],"tested":[270],"datasets":[273],"demonstrate":[274],"superiority":[276],"our":[278],"method":[279],"conventional,":[281],"noisy,":[282],"open-set":[284],"scenarios.":[286]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-11-07T00:00:00"}
