{"id":"https://openalex.org/W4408930147","doi":"https://doi.org/10.1145/3726528","title":"Learning Visual-Semantic Embedding for Generalizable Person Re-Identification: A Unified Perspective","display_name":"Learning Visual-Semantic Embedding for Generalizable Person Re-Identification: A Unified Perspective","publication_year":2025,"publication_date":"2025-03-28","ids":{"openalex":"https://openalex.org/W4408930147","doi":"https://doi.org/10.1145/3726528"},"language":"en","primary_location":{"id":"doi:10.1145/3726528","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3726528","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3726528","source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3726528","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027871520","display_name":"Suncheng Xiang","orcid":"https://orcid.org/0000-0002-9141-6460"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Suncheng Xiang","raw_affiliation_strings":["School of Biomedical Engineering, Shanghai Jiao Tong University, Shanghai, China","School of Biomedical Engineering, Shanghai Jiao Tong University, China"],"raw_orcid":"https://orcid.org/0000-0002-9141-6460","affiliations":[{"raw_affiliation_string":"School of Biomedical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"School of Biomedical Engineering, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026260510","display_name":"Jingsheng Gao","orcid":"https://orcid.org/0000-0001-6271-0903"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingsheng Gao","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, China"],"raw_orcid":"https://orcid.org/0000-0001-6271-0903","affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076218215","display_name":"Mingye Xie","orcid":"https://orcid.org/0000-0001-9826-9806"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingye Xie","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, China"],"raw_orcid":"https://orcid.org/0000-0001-9826-9806","affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088135786","display_name":"Mengyuan Guan","orcid":"https://orcid.org/0000-0001-7327-0608"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengyuan Guan","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, China"],"raw_orcid":"https://orcid.org/0000-0001-7327-0608","affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114416551","display_name":"Jiacheng Ruan","orcid":"https://orcid.org/0000-0001-5469-507X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiacheng Ruan","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, China"],"raw_orcid":"https://orcid.org/0000-0001-5469-507X","affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101704886","display_name":"Yuzhuo Fu","orcid":"https://orcid.org/0000-0001-5516-3016"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuzhuo Fu","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, China"],"raw_orcid":"https://orcid.org/0000-0001-5516-3016","affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5027871520"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":3.3997,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.91719848,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"21","issue":"10","first_page":"1","last_page":"17"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8815435171127319},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.7198623418807983},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.6394805908203125},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6163995265960693},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.537783682346344},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.47112321853637695},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.46608230471611023},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3954576849937439},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.33575719594955444}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8815435171127319},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.7198623418807983},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.6394805908203125},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6163995265960693},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.537783682346344},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.47112321853637695},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.46608230471611023},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3954576849937439},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.33575719594955444},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3726528","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3726528","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3726528","source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3726528","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3726528","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3726528","source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2362817167","display_name":null,"funder_award_id":"62301315","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4408930147.pdf"},"referenced_works_count":36,"referenced_works":["https://openalex.org/W1949591461","https://openalex.org/W1971955426","https://openalex.org/W1982925187","https://openalex.org/W2069065514","https://openalex.org/W2186222003","https://openalex.org/W2204750386","https://openalex.org/W2584637367","https://openalex.org/W2962858109","https://openalex.org/W2963000559","https://openalex.org/W2963043696","https://openalex.org/W2963047834","https://openalex.org/W2963449390","https://openalex.org/W2963557071","https://openalex.org/W2963975998","https://openalex.org/W2967515867","https://openalex.org/W3081136368","https://openalex.org/W3098711604","https://openalex.org/W3148011420","https://openalex.org/W3155080005","https://openalex.org/W3174702195","https://openalex.org/W3206322224","https://openalex.org/W3208382980","https://openalex.org/W3213438015","https://openalex.org/W4214540501","https://openalex.org/W4214736485","https://openalex.org/W4220757105","https://openalex.org/W4236965008","https://openalex.org/W4281749424","https://openalex.org/W4293211937","https://openalex.org/W4301409532","https://openalex.org/W4304091756","https://openalex.org/W4327950385","https://openalex.org/W4383314927","https://openalex.org/W4384820933","https://openalex.org/W4387698360","https://openalex.org/W4393156091"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2081900870","https://openalex.org/W2018871932","https://openalex.org/W641279757","https://openalex.org/W370975646","https://openalex.org/W1670566515","https://openalex.org/W4242022592","https://openalex.org/W596972243","https://openalex.org/W2149537132","https://openalex.org/W2037549926"],"abstract_inverted_index":{"Generalizable":[0],"person":[1,138],"Re-Identification":[2],"(Re-ID)":[3],"is":[4,110,170],"a":[5,18,74,100],"very":[6],"hot":[7],"research":[8,162],"topic":[9],"in":[10,21,29,95],"machine":[11],"learning":[12,84,94],"and":[13,32,118,131],"computer":[14],"vision,":[15],"which":[16,56,122],"plays":[17],"significant":[19],"role":[20],"realistic":[22],"scenarios":[23],"due":[24],"to":[25,47,59,65,112],"its":[26],"various":[27],"applications":[28],"public":[30],"security":[31],"video":[33],"surveillance.":[34],"However,":[35],"previous":[36,153],"methods":[37],"mainly":[38],"focus":[39],"on":[40,85,126,142],"the":[41,49,66,91,96,115,119,134,146,161],"visual":[42],"representation":[43,165],"learning,":[44],"while":[45],"neglect":[46],"explore":[48],"potential":[50],"of":[51,98,136,149],"semantic":[52],"features":[53],"during":[54],"training,":[55],"easily":[57],"leads":[58],"poor":[60],"generalization":[61],"capability":[62],"when":[63],"adapted":[64],"new":[67],"domain.":[68],"In":[69],"this":[70,157],"article,":[71],"we":[72],"present":[73],"unified":[75],"perspective":[76],"called":[77,104],"MMET":[78],"for":[79],"more":[80],"robust":[81,92],"visual-semantic":[82,164],"embedding":[83],"generalizable":[86,137],"Re-ID.":[87,139],"To":[88],"further":[89],"enhance":[90],"feature":[93],"context":[97],"transformer,":[99],"dynamic":[101],"masking":[102],"mechanism":[103],"Masked":[105],"Multimodal":[106],"Modeling":[107],"(MMM)":[108],"strategy":[109],"introduced":[111],"mask":[113],"both":[114],"image":[116],"patches":[117],"text":[120],"tokens,":[121],"can":[123],"jointly":[124],"work":[125],"multimodal":[127],"or":[128],"unimodal":[129],"data":[130],"significantly":[132],"boost":[133],"performance":[135,148],"Extensive":[140],"experiments":[141],"benchmark":[143],"datasets":[144],"demonstrate":[145],"competitive":[147],"our":[150],"method":[151,158],"over":[152],"approaches.":[154],"We":[155],"hope":[156],"could":[159],"advance":[160],"towards":[163],"learning.":[166],"Our":[167],"source":[168],"code":[169],"also":[171],"publicly":[172],"available":[173],"at":[174],"https://github.com/JeremyXSC/MMET":[175],".":[176]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
