{"id":"https://openalex.org/W4415747953","doi":"https://doi.org/10.1109/tmc.2025.3626724","title":"Task-Oriented Feature Compression for Multimodal Understanding via Device-Edge Co-Inference","display_name":"Task-Oriented Feature Compression for Multimodal Understanding via Device-Edge Co-Inference","publication_year":2025,"publication_date":"2025-10-31","ids":{"openalex":"https://openalex.org/W4415747953","doi":"https://doi.org/10.1109/tmc.2025.3626724"},"language":"en","primary_location":{"id":"doi:10.1109/tmc.2025.3626724","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmc.2025.3626724","pdf_url":null,"source":{"id":"https://openalex.org/S69141925","display_name":"IEEE Transactions on Mobile Computing","issn_l":"1536-1233","issn":["1536-1233","1558-0660","2161-9875"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Mobile Computing","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2503.12926","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045620060","display_name":"Cheng Yuan","orcid":"https://orcid.org/0009-0003-5086-3066"},"institutions":[{"id":"https://openalex.org/I4210136246","display_name":"China Telecom (China)","ror":"https://ror.org/03jgnzt20","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210136246"]},{"id":"https://openalex.org/I4387153335","display_name":"China Telecom","ror":"https://ror.org/05p67dv18","country_code":null,"type":"company","lineage":["https://openalex.org/I4387153335"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng Yuan","raw_affiliation_strings":["Institute of Artificial Intelligence (TeleAI) of China Telecom, Beijing, China","Institute of Artificial Intelligence (TeleAI) of China Telecom, China"],"raw_orcid":"https://orcid.org/0009-0003-5086-3066","affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence (TeleAI) of China Telecom, Beijing, China","institution_ids":["https://openalex.org/I4210136246","https://openalex.org/I4387153335"]},{"raw_affiliation_string":"Institute of Artificial Intelligence (TeleAI) of China Telecom, China","institution_ids":["https://openalex.org/I4210136246","https://openalex.org/I4387153335"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050006234","display_name":"Zhening Liu","orcid":"https://orcid.org/0009-0001-6502-368X"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Zhening Liu","raw_affiliation_strings":["Department of Electronic and Computer Engineering, Hong Kong University of Science and Technology, Hong Kong"],"raw_orcid":"https://orcid.org/0009-0001-6502-368X","affiliations":[{"raw_affiliation_string":"Department of Electronic and Computer Engineering, Hong Kong University of Science and Technology, Hong Kong","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jiashu Lv","orcid":"https://orcid.org/0009-0009-4157-3108"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiashu Lv","raw_affiliation_strings":["School of Software and Microelectronics, Peking University, Beijing, China","School of Software and Microelectronics, Peking University, China"],"raw_orcid":"https://orcid.org/0009-0009-4157-3108","affiliations":[{"raw_affiliation_string":"School of Software and Microelectronics, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Software and Microelectronics, Peking University, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102806605","display_name":"Jiawei Shao","orcid":"https://orcid.org/0000-0001-8836-1430"},"institutions":[{"id":"https://openalex.org/I4210136246","display_name":"China Telecom (China)","ror":"https://ror.org/03jgnzt20","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210136246"]},{"id":"https://openalex.org/I4387153335","display_name":"China Telecom","ror":"https://ror.org/05p67dv18","country_code":null,"type":"company","lineage":["https://openalex.org/I4387153335"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiawei Shao","raw_affiliation_strings":["Institute of Artificial Intelligence (TeleAI) of China Telecom, Beijing, China","Institute of Artificial Intelligence (TeleAI) of China Telecom, China"],"raw_orcid":"https://orcid.org/0000-0001-8836-1430","affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence (TeleAI) of China Telecom, Beijing, China","institution_ids":["https://openalex.org/I4210136246","https://openalex.org/I4387153335"]},{"raw_affiliation_string":"Institute of Artificial Intelligence (TeleAI) of China Telecom, China","institution_ids":["https://openalex.org/I4210136246","https://openalex.org/I4387153335"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071060953","display_name":"Yufei Jiang","orcid":"https://orcid.org/0000-0003-0523-8117"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yufei Jiang","raw_affiliation_strings":["School of Electronic and Information Engineering, Harbin Institute of Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0003-0523-8117","affiliations":[{"raw_affiliation_string":"School of Electronic and Information Engineering, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100433167","display_name":"Jun Zhang","orcid":"https://orcid.org/0000-0002-5222-1898"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jun Zhang","raw_affiliation_strings":["Department of Electronic and Computer Engineering, Hong Kong University of Science and Technology, Hong Kong"],"raw_orcid":"https://orcid.org/0000-0002-5222-1898","affiliations":[{"raw_affiliation_string":"Department of Electronic and Computer Engineering, Hong Kong University of Science and Technology, Hong Kong","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5106943753","display_name":"Xuelong Li","orcid":"https://orcid.org/0000-0003-2924-946X"},"institutions":[{"id":"https://openalex.org/I4210136246","display_name":"China Telecom (China)","ror":"https://ror.org/03jgnzt20","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210136246"]},{"id":"https://openalex.org/I4387153335","display_name":"China Telecom","ror":"https://ror.org/05p67dv18","country_code":null,"type":"company","lineage":["https://openalex.org/I4387153335"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuelong Li","raw_affiliation_strings":["Institute of Artificial Intelligence (TeleAI) of China Telecom, Beijing, China","Institute of Artificial Intelligence (TeleAI) of China Telecom, China"],"raw_orcid":"https://orcid.org/0000-0003-2924-946X","affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence (TeleAI) of China Telecom, Beijing, China","institution_ids":["https://openalex.org/I4210136246","https://openalex.org/I4387153335"]},{"raw_affiliation_string":"Institute of Artificial Intelligence (TeleAI) of China Telecom, China","institution_ids":["https://openalex.org/I4210136246","https://openalex.org/I4387153335"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.9349,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.80574396,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"25","issue":"4","first_page":"4762","last_page":"4775"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9519000053405762,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9519000053405762,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.006899999920278788,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.005900000222027302,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5990999937057495},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.5216000080108643},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4936000108718872},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.49230000376701355},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.4839000105857849},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.39800000190734863},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3955000042915344},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.36390000581741333},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.3555000126361847}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8622000217437744},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5990999937057495},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.5216000080108643},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5062000155448914},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4936000108718872},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.49230000376701355},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.4839000105857849},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.39800000190734863},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3955000042915344},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.36390000581741333},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.3555000126361847},{"id":"https://openalex.org/C81081738","wikidata":"https://www.wikidata.org/wiki/Q55542","display_name":"Lossless compression","level":3,"score":0.3440000116825104},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.33250001072883606},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.32910001277923584},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.3276999890804291},{"id":"https://openalex.org/C160086991","wikidata":"https://www.wikidata.org/wiki/Q5939193","display_name":"Human visual system model","level":3,"score":0.32760000228881836},{"id":"https://openalex.org/C13481523","wikidata":"https://www.wikidata.org/wiki/Q412438","display_name":"Image compression","level":4,"score":0.3100000023841858},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.30230000615119934},{"id":"https://openalex.org/C1769480","wikidata":"https://www.wikidata.org/wiki/Q1345239","display_name":"Entropy encoding","level":3,"score":0.2980000078678131},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2964000105857849},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.29120001196861267},{"id":"https://openalex.org/C557945733","wikidata":"https://www.wikidata.org/wiki/Q389772","display_name":"Data transmission","level":2,"score":0.28290000557899475},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.28040000796318054},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2687999904155731},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.26179999113082886},{"id":"https://openalex.org/C46637626","wikidata":"https://www.wikidata.org/wiki/Q6693015","display_name":"Low latency (capital markets)","level":2,"score":0.2612000107765198},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.2556000053882599}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tmc.2025.3626724","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmc.2025.3626724","pdf_url":null,"source":{"id":"https://openalex.org/S69141925","display_name":"IEEE Transactions on Mobile Computing","issn_l":"1536-1233","issn":["1536-1233","1558-0660","2161-9875"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Mobile Computing","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2503.12926","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.12926","pdf_url":"https://arxiv.org/pdf/2503.12926","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-167270","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-167270","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2503.12926","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.12926","pdf_url":"https://arxiv.org/pdf/2503.12926","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,27,34,66,135,179,182,191,203,206],"rapid":[2],"development":[3],"of":[4,57,69,137,181,190,205],"large":[5],"multimodal":[6,9,93],"models":[7,173],"(LMMs),":[8],"understanding":[10,94],"applications":[11],"are":[12,103,174],"emerging.":[13],"As":[14],"most":[15],"LMM":[16],"inference":[17,29],"requests":[18],"originate":[19],"from":[20],"edge":[21,39,58],"devices":[22,59],"with":[23,153,235],"limited":[24,54],"computational":[25,146],"capabilities,":[26],"predominant":[28],"pipeline":[30],"involves":[31],"directly":[32],"forwarding":[33],"input":[35],"data":[36,143,220],"to":[37,53,133,157,216],"an":[38],"server":[40],"which":[41],"handles":[42],"all":[43],"computations.":[44],"However,":[45],"this":[46,82],"approach":[47],"introduces":[48],"high":[49],"transmission":[50,144,165,221],"latency":[51,63,228],"due":[52],"uplink":[55],"bandwidth":[56],"and":[60,76,107,112,145,159,223],"significant":[61],"computation":[62],"caused":[64],"by":[65,105,109],"prohibitive":[67],"number":[68,136],"visual":[70,101,138,183,198],"tokens,":[71],"thus":[72],"hindering":[73],"delay-sensitive":[74],"tasks":[75],"degrading":[77],"user":[78],"experience.":[79],"To":[80,167],"address":[81],"challenge,":[83],"we":[84,120],"propose":[85],"a":[86,96,110,149,186],"task-oriented":[87],"feature":[88,117],"compression":[89,169,237],"(TOFC)":[90],"method":[91],"for":[92],"in":[95,219,226],"device-edge":[97],"co-inference":[98],"framework,":[99],"where":[100],"features":[102],"merged":[104,161],"clustering":[106,124],"encoded":[108],"learnable":[111,150],"selective":[113],"entropy":[114,151,172],"model":[115,152],"before":[116],"projection.":[118],"Specifically,":[119],"employ":[121],"density":[122],"peaks":[123],"based":[125,177],"on":[126,178,196],"<inline-formula":[127],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[128],"xmlns:xlink=\"http://www.w3.org/1999/xlink\"><tex-math":[129],"notation=\"LaTeX\">$K$</tex-math></inline-formula>":[130],"nearest":[131],"neighbors":[132],"reduce":[134],"features,":[139,162,184],"thereby":[140],"minimizing":[141],"both":[142],"complexity.":[147],"Subsequently,":[148],"hyperprior":[154],"is":[155],"utilized":[156],"encode":[158],"decode":[160],"further":[163],"reducing":[164],"overhead.":[166],"enhance":[168],"efficiency,":[170],"multiple":[171],"adaptively":[175],"selected":[176],"characteristics":[180],"enabling":[185],"more":[187],"accurate":[188],"estimation":[189],"probability":[192],"distribution.":[193],"Comprehensive":[194],"experiments":[195],"seven":[197],"question":[199],"answering":[200],"benchmarks":[201],"validate":[202],"effectiveness":[204],"proposed":[207],"TOFC":[208,213],"method.":[209],"Results":[210],"show":[211],"that":[212],"achieves":[214],"up":[215],"52%":[217],"reduction":[218,225],"overhead":[222],"63%":[224],"system":[227],"while":[229],"maintaining":[230],"identical":[231],"task":[232],"performance,":[233],"compared":[234],"neural":[236],"ELIC.":[238]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-31T00:00:00"}
