{"id":"https://openalex.org/W3174995126","doi":"https://doi.org/10.1145/3477083.3480150","title":"Towards memory-efficient inference in edge video analytics","display_name":"Towards memory-efficient inference in edge video analytics","publication_year":2021,"publication_date":"2021-10-08","ids":{"openalex":"https://openalex.org/W3174995126","doi":"https://doi.org/10.1145/3477083.3480150","mag":"3174995126"},"language":"en","primary_location":{"id":"doi:10.1145/3477083.3480150","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3477083.3480150","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3477083.3480150","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 3rd ACM Workshop on Hot Topics in Video Analytics and Intelligent Edges","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3477083.3480150","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069421494","display_name":"Arthi Padmanabhan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210135422","display_name":"Microsoft (Norway)","ror":"https://ror.org/03jtz4s80","country_code":"NO","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210135422"]}],"countries":["NO"],"is_corresponding":true,"raw_author_name":"Arthi Padmanabhan","raw_affiliation_strings":["Microsoft &amp; UCLA"],"affiliations":[{"raw_affiliation_string":"Microsoft &amp; UCLA","institution_ids":["https://openalex.org/I4210135422"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090733623","display_name":"Anand Iyer","orcid":"https://orcid.org/0009-0009-3700-2994"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Anand Padmanabha Iyer","raw_affiliation_strings":["Microsoft Research"],"affiliations":[{"raw_affiliation_string":"Microsoft Research","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031071237","display_name":"Ganesh Ananthanarayanan","orcid":"https://orcid.org/0000-0002-7479-1664"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ganesh Ananthanarayanan","raw_affiliation_strings":["Microsoft Research"],"affiliations":[{"raw_affiliation_string":"Microsoft Research","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016472874","display_name":"Yuanchao Shu","orcid":"https://orcid.org/0000-0002-9542-7095"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yuanchao Shu","raw_affiliation_strings":["Microsoft Research"],"affiliations":[{"raw_affiliation_string":"Microsoft Research","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076846509","display_name":"Nikolaos Karianakis","orcid":null},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Nikolaos Karianakis","raw_affiliation_strings":["Microsoft Research"],"affiliations":[{"raw_affiliation_string":"Microsoft Research","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101967307","display_name":"Guoqing Xu","orcid":"https://orcid.org/0000-0003-4737-2146"},"institutions":[{"id":"https://openalex.org/I2799798094","display_name":"UCLA Health","ror":"https://ror.org/01d88se56","country_code":"US","type":"funder","lineage":["https://openalex.org/I2799798094"]},{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Guoqing Harry Xu","raw_affiliation_strings":["UCLA","Microsoft Research"],"affiliations":[{"raw_affiliation_string":"UCLA","institution_ids":["https://openalex.org/I2799798094"]},{"raw_affiliation_string":"Microsoft Research","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053593890","display_name":"Ravi Netravali","orcid":"https://orcid.org/0000-0001-7002-5033"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ravi Netravali","raw_affiliation_strings":["Princeton University"],"affiliations":[{"raw_affiliation_string":"Princeton University","institution_ids":["https://openalex.org/I20089843"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5069421494"],"corresponding_institution_ids":["https://openalex.org/I4210135422"],"apc_list":null,"apc_paid":null,"fwci":0.6725,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.70813725,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"31","last_page":"37"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8528034687042236},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.746710479259491},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.611518383026123},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.6027406454086304},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5406704545021057},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.5001108646392822},{"id":"https://openalex.org/keywords/memory-management","display_name":"Memory management","score":0.4785250425338745},{"id":"https://openalex.org/keywords/edge-computing","display_name":"Edge computing","score":0.47540196776390076},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.4639344811439514},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.4181613028049469},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.4148673713207245},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.38041362166404724},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.37523549795150757},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.23885783553123474},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.21264132857322693},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1423637866973877},{"id":"https://openalex.org/keywords/semiconductor-memory","display_name":"Semiconductor memory","score":0.13405081629753113},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.10630926489830017}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8528034687042236},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.746710479259491},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.611518383026123},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.6027406454086304},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5406704545021057},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.5001108646392822},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.4785250425338745},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.47540196776390076},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.4639344811439514},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.4181613028049469},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.4148673713207245},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.38041362166404724},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.37523549795150757},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.23885783553123474},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.21264132857322693},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1423637866973877},{"id":"https://openalex.org/C98986596","wikidata":"https://www.wikidata.org/wiki/Q1143031","display_name":"Semiconductor memory","level":2,"score":0.13405081629753113},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.10630926489830017},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3477083.3480150","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3477083.3480150","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3477083.3480150","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 3rd ACM Workshop on Hot Topics in Video Analytics and Intelligent Edges","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3477083.3480150","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3477083.3480150","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3477083.3480150","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 3rd ACM Workshop on Hot Topics in Video Analytics and Intelligent Edges","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3174995126.pdf","grobid_xml":"https://content.openalex.org/works/W3174995126.grobid-xml"},"referenced_works_count":27,"referenced_works":["https://openalex.org/W1475617732","https://openalex.org/W1934410531","https://openalex.org/W2086402015","https://openalex.org/W2565639579","https://openalex.org/W2599765304","https://openalex.org/W2752236330","https://openalex.org/W2767011558","https://openalex.org/W2809420642","https://openalex.org/W2885829265","https://openalex.org/W2896225285","https://openalex.org/W2899071864","https://openalex.org/W2910100551","https://openalex.org/W2913340405","https://openalex.org/W2946920775","https://openalex.org/W2962677625","https://openalex.org/W2963510045","https://openalex.org/W2971843695","https://openalex.org/W2972871493","https://openalex.org/W2986646794","https://openalex.org/W2999418247","https://openalex.org/W3012121966","https://openalex.org/W3012479151","https://openalex.org/W3046256272","https://openalex.org/W3080230561","https://openalex.org/W6600281463","https://openalex.org/W6608099265","https://openalex.org/W6679215085"],"related_works":["https://openalex.org/W3154796165","https://openalex.org/W4322761281","https://openalex.org/W4238233472","https://openalex.org/W4313526662","https://openalex.org/W4312996489","https://openalex.org/W3111395152","https://openalex.org/W3106131444","https://openalex.org/W3216099748","https://openalex.org/W4205963435","https://openalex.org/W2893963003"],"abstract_inverted_index":{"Video":[0],"analytics":[1],"pipelines":[2],"incorporate":[3],"on-premise":[4],"edge":[5,22,107],"servers":[6,23],"to":[7,19,67,137],"lower":[8,26],"analysis":[9],"latency,":[10],"ensure":[11],"privacy,":[12],"and":[13,29,42,54,65,75,111],"reduce":[14,68],"bandwidth":[15],"requirements.":[16,143],"However,":[17],"compared":[18],"the":[20,33,69,94,106,141,153],"cloud,":[21],"typically":[24],"have":[25],"processing":[27],"power":[28],"GPU":[30],"memory,":[31],"limiting":[32],"number":[34],"of":[35,56],"video":[36],"streams":[37],"that":[38,103,112,129],"they":[39],"can":[40,119],"manage":[41],"analyze.":[43],"Existing":[44],"solutions":[45],"for":[46],"memory":[47,91,123,142],"management,":[48],"such":[49,130],"as":[50,87],"swapping":[51],"models":[52,104,118],"in":[53,121,135,140],"out":[55],"GPU,":[57],"having":[58],"a":[59],"common":[60,109,115],"model":[61,70,85,154],"stem,":[62],"or":[63],"compression":[64],"quantization":[66],"size":[71],"incur":[72],"high":[73],"overheads":[74],"often":[76],"provide":[77],"limited":[78],"benefits.":[79],"In":[80],"this":[81],"paper,":[82],"we":[83],"propose":[84],"merging":[86,113,155],"an":[88,131],"approach":[89,132],"towards":[90],"management":[92],"at":[93,105],"edge.":[95],"This":[96],"proposal":[97],"is":[98],"based":[99],"on":[100],"our":[101],"observation":[102],"share":[108],"layers,":[110],"these":[114],"layers":[116],"across":[117],"result":[120,134],"significant":[122],"savings.":[124],"Our":[125],"preliminary":[126],"evaluation":[127],"indicates":[128],"could":[133],"up":[136],"75%":[138],"savings":[139],"We":[144],"conclude":[145],"by":[146],"discussing":[147],"several":[148],"challenges":[149],"involved":[150],"with":[151],"realizing":[152],"vision.":[156]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
