{"id":"https://openalex.org/W7129054858","doi":"https://doi.org/10.48550/arxiv.2602.12936","title":"Unleashing MLLMs on the Edge: A Unified Framework for Cross-Modal ReID via Adaptive SVD Distillation","display_name":"Unleashing MLLMs on the Edge: A Unified Framework for Cross-Modal ReID via Adaptive SVD Distillation","publication_year":2026,"publication_date":"2026-02-13","ids":{"openalex":"https://openalex.org/W7129054858","doi":"https://doi.org/10.48550/arxiv.2602.12936"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.12936","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126098306","display_name":"Hongbo Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jiang, Hongbo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126161740","display_name":"Jie Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126164758","display_name":"Xinqi Cai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Xinqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126122806","display_name":"Tianyu Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Tianyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126087636","display_name":"Yunhang Shen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Yunhang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032612432","display_name":"Pingyang Dai","orcid":"https://orcid.org/0000-0001-9780-271X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dai, Pingyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126083256","display_name":"Liujuan Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Liujuan","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5126098306"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.36169999837875366,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.36169999837875366,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.2603999972343445,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.04749999940395355,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6071000099182129},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5792999863624573},{"id":"https://openalex.org/keywords/unification","display_name":"Unification","score":0.5616999864578247},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.5205000042915344},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.4683000147342682},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.4659000039100647},{"id":"https://openalex.org/keywords/unified-model","display_name":"Unified Model","score":0.46480000019073486},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.43220001459121704},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.41119998693466187},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.4027000069618225}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7601000070571899},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6071000099182129},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5792999863624573},{"id":"https://openalex.org/C96146094","wikidata":"https://www.wikidata.org/wiki/Q609057","display_name":"Unification","level":2,"score":0.5616999864578247},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.5205000042915344},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.4683000147342682},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4659000039100647},{"id":"https://openalex.org/C45493050","wikidata":"https://www.wikidata.org/wiki/Q7884934","display_name":"Unified Model","level":2,"score":0.46480000019073486},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45210000872612},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.43220001459121704},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.41119998693466187},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4043000042438507},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.4027000069618225},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3758000135421753},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.37290000915527344},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.35690000653266907},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3422999978065491},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.3391000032424927},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.3077000081539154},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.3070000112056732},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.30480000376701355},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.30390000343322754},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.30059999227523804},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.2953999936580658},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2937000095844269},{"id":"https://openalex.org/C171018156","wikidata":"https://www.wikidata.org/wiki/Q7370306","display_name":"Rotation formalisms in three dimensions","level":2,"score":0.2928999960422516},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.27900001406669617},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.2750000059604645},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.2727999985218048},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.262800008058548},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.26190000772476196},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.257999986410141}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.12936","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.12936","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.12936","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.12936","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Practical":[0],"cloud-edge":[1,66],"deployment":[2],"of":[3,15],"Cross-Modal":[4],"Re-identification":[5],"(CM-ReID)":[6],"faces":[7],"challenges":[8],"due":[9],"to":[10,35,83,122],"maintaining":[11],"a":[12,39,59,64,71,75,89,107,116,132,153,164,194],"fragmented":[13],"ecosystem":[14],"specialized":[16],"cloud":[17,77],"models":[18,210],"for":[19,49,199],"diverse":[20],"modalities.":[21,99],"While":[22],"Multi-Modal":[23],"Large":[24],"Language":[25],"Models":[26],"(MLLMs)":[27],"offer":[28],"strong":[29],"unification":[30],"potential,":[31],"existing":[32],"approaches":[33],"fail":[34],"adapt":[36,70],"them":[37],"into":[38,74],"single":[40],"end-to-end":[41],"backbone":[42],"and":[43,97,196,209],"lack":[44],"effective":[45,197],"knowledge":[46,125],"distillation":[47,134],"strategies":[48],"edge":[50],"deployment.":[51],"To":[52,146],"address":[53],"these":[54],"limitations,":[55],"we":[56,69,130],"propose":[57],"MLLMEmbed-ReID,":[58],"unified":[60,90,201],"framework":[61,191],"based":[62],"on":[63,175,204],"powerful":[65],"architecture.":[67],"First,":[68],"foundational":[72],"MLLM":[73,86],"state-of-the-art":[76,173],"model.":[78],"We":[79],"leverage":[80],"instruction-based":[81],"prompting":[82],"guide":[84],"the":[85,138,142],"in":[87,141],"generating":[88],"embedding":[91],"space":[92],"across":[93,185],"RGB,":[94],"infrared,":[95],"sketch,":[96],"text":[98],"This":[100],"model":[101,171],"is":[102],"then":[103],"trained":[104],"efficiently":[105],"with":[106],"hierarchical":[108],"Low-Rank":[109],"Adaptation":[110],"finetuning":[111],"(LoRA-SFT)":[112],"strategy,":[113],"optimized":[114],"under":[115],"holistic":[117],"cross-modal":[118],"alignment":[119],"objective.":[120],"Second,":[121],"deploy":[123],"its":[124,181],"onto":[126],"an":[127],"edge-native":[128],"student,":[129],"introduce":[131],"novel":[133],"strategy":[135],"motivated":[136],"by":[137],"low-rank":[139],"property":[140],"teacher's":[143],"feature":[144],"space.":[145],"prioritize":[147],"essential":[148],"information,":[149],"this":[150],"method":[151],"employs":[152],"Principal":[154],"Component":[155],"Mapping":[156],"loss,":[157],"while":[158,180],"relational":[159],"structures":[160],"are":[161],"preserved":[162],"via":[163],"Feature":[165],"Relation":[166],"loss.":[167],"Our":[168],"lightweight":[169],"edge-based":[170],"achieves":[172],"performance":[174],"multiple":[176],"visual":[177],"CM-ReID":[178,187],"benchmarks,":[179],"cloud-based":[182],"counterpart":[183],"excels":[184],"all":[186],"benchmarks.":[188],"The":[189,207],"MLLMEmbed-ReID":[190],"thus":[192],"presents":[193],"complete":[195],"solution":[198],"deploying":[200],"MLLM-level":[202],"intelligence":[203],"resource-constrained":[205],"devices.":[206],"code":[208],"will":[211],"be":[212],"open-sourced":[213],"soon.":[214]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-17T00:00:00"}
