{"id":"https://openalex.org/W7131316944","doi":"https://doi.org/10.1109/vcip67698.2025.11396894","title":"Lightweight Motion-Vector-Based Segmentation Mask Tracking for Saliency-Based Rate Control","display_name":"Lightweight Motion-Vector-Based Segmentation Mask Tracking for Saliency-Based Rate Control","publication_year":2025,"publication_date":"2025-12-01","ids":{"openalex":"https://openalex.org/W7131316944","doi":"https://doi.org/10.1109/vcip67698.2025.11396894"},"language":"en","primary_location":{"id":"doi:10.1109/vcip67698.2025.11396894","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip67698.2025.11396894","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126673606","display_name":"Minh Hoang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210133110","display_name":"Tampere University","ror":null,"country_code":"FI","type":null,"lineage":["https://openalex.org/I4210133110"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Minh Hoang","raw_affiliation_strings":["Ultra Video Group, Tampere University,Tampere,Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ultra Video Group, Tampere University,Tampere,Finland","institution_ids":["https://openalex.org/I4210133110"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059056398","display_name":"Tero Partanen","orcid":"https://orcid.org/0000-0002-9975-0535"},"institutions":[{"id":"https://openalex.org/I4210133110","display_name":"Tampere University","ror":null,"country_code":"FI","type":null,"lineage":["https://openalex.org/I4210133110"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Tero Partanen","raw_affiliation_strings":["Ultra Video Group, Tampere University,Tampere,Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ultra Video Group, Tampere University,Tampere,Finland","institution_ids":["https://openalex.org/I4210133110"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002772631","display_name":"Jarno Vanne","orcid":"https://orcid.org/0000-0002-7944-1938"},"institutions":[{"id":"https://openalex.org/I4210133110","display_name":"Tampere University","ror":null,"country_code":"FI","type":null,"lineage":["https://openalex.org/I4210133110"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Jarno Vanne","raw_affiliation_strings":["Ultra Video Group, Tampere University,Tampere,Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ultra Video Group, Tampere University,Tampere,Finland","institution_ids":["https://openalex.org/I4210133110"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065615731","display_name":"Alexandre Mercat","orcid":"https://orcid.org/0000-0003-2211-970X"},"institutions":[{"id":"https://openalex.org/I4210133110","display_name":"Tampere University","ror":null,"country_code":"FI","type":null,"lineage":["https://openalex.org/I4210133110"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Alexandre Mercat","raw_affiliation_strings":["Ultra Video Group, Tampere University,Tampere,Finland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Ultra Video Group, Tampere University,Tampere,Finland","institution_ids":["https://openalex.org/I4210133110"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210133110"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.61644911,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.1395999938249588,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.1395999938249588,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.10450000315904617,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.06889999657869339,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7369999885559082},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.6327999830245972},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.5174999833106995},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.49970000982284546},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4648999869823456},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.4629000127315521},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4154999852180481},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.41100001335144043}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7577999830245972},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7512999773025513},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7473999857902527},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7369999885559082},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.6327999830245972},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.5174999833106995},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.49970000982284546},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4648999869823456},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.4629000127315521},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4154999852180481},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.41100001335144043},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.3720000088214874},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3538999855518341},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.35100001096725464},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.3476000130176544},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.3197000026702881},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.31630000472068787},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.31459999084472656},{"id":"https://openalex.org/C154586513","wikidata":"https://www.wikidata.org/wiki/Q4420972","display_name":"Tracking system","level":3,"score":0.29750001430511475},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.26510000228881836},{"id":"https://openalex.org/C43711488","wikidata":"https://www.wikidata.org/wiki/Q7534783","display_name":"Skew","level":2,"score":0.25459998846054077},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2517000138759613}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/vcip67698.2025.11396894","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip67698.2025.11396894","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"},{"id":"pmh:oai:trepo.tuni.fi:10024/234819","is_oa":false,"landing_page_url":"https://trepo.tuni.fi/handle/10024/234819","pdf_url":null,"source":{"id":"https://openalex.org/S7407055260","display_name":"Trepo - Institutional Repository of Tampere University","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"conference"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320328501","display_name":"Business Finland","ror":"https://ror.org/05bgf9v38"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W1995903777","https://openalex.org/W2131070359","https://openalex.org/W2146395539","https://openalex.org/W2340897893","https://openalex.org/W2531409750","https://openalex.org/W2575115075","https://openalex.org/W2890125283","https://openalex.org/W2922350647","https://openalex.org/W2948672349","https://openalex.org/W2962967409","https://openalex.org/W3034199015","https://openalex.org/W3082045773","https://openalex.org/W3098621856","https://openalex.org/W3106734873","https://openalex.org/W3118212025","https://openalex.org/W3159734877","https://openalex.org/W3202918664","https://openalex.org/W4239147634","https://openalex.org/W4386575106","https://openalex.org/W4396808786","https://openalex.org/W4404577090","https://openalex.org/W4406013928","https://openalex.org/W4406867249"],"related_works":[],"abstract_inverted_index":{"In":[0],"video":[1,70],"encoding,":[2],"saliency-based":[3],"rate":[4],"control":[5],"improves":[6],"coding":[7],"efficiency":[8],"without":[9],"compromising":[10],"perceptual":[11],"quality":[12],"by":[13,55],"allocating":[14],"more":[15,36],"bits":[16],"to":[17,45,74,134,157],"visually":[18],"important":[19],"regions.":[20],"While":[21],"object":[22,40],"detection":[23],"can":[24],"guide":[25],"bit":[26],"allocation":[27],"through":[28],"rectangular":[29],"bounding":[30],"boxes,":[31],"segmentation":[32,54,59,86,124],"masks":[33],"offer":[34],"a":[35,57,90,99,127,158,163],"accurate":[37],"delineation":[38],"of":[39,51,118,121],"boundaries.":[41],"This":[42],"paper":[43],"seeks":[44],"reduce":[46],"the":[47,69,113,119,139,142],"significant":[48],"computational":[49,106,132],"burden":[50],"frame-by-frame":[52,122],"instance":[53,123],"proposing":[56],"lightweight":[58],"mask":[60,87],"tracking":[61,95,153],"scheme,":[62],"in":[63,152],"which":[64],"motion":[65],"vectors":[66],"(MVs)":[67],"from":[68],"encoder":[71],"are":[72,145],"used":[73],"predict":[75],"per-vertex":[76],"displacements.":[77],"Altogether,":[78],"we":[79],"propose":[80],"two":[81],"neural":[82],"network":[83],"designs":[84],"for":[85,94,166],"tracking:":[88],"(1)":[89],"base":[91,114],"tracker":[92,101,115],"optimized":[93],"accuracy;":[96],"and":[97,105,130,148],"(2)":[98],"lite":[100,140],"that":[102,112],"balances":[103],"accuracy":[104,120],"complexity.":[107],"Our":[108],"experimental":[109],"results":[110],"show":[111],"attains":[116],"70-88%":[117],"but":[125],"achieves":[126],"48\u00d7":[128],"speedup":[129],"reduces":[131],"complexity":[133,156],"0.03%":[135],"on":[136],"CPU.":[137],"For":[138],"tracker,":[141],"corresponding":[143],"figures":[144],"49\u00d7,":[146],"0.01%,":[147],"67-88%.":[149],"Despite":[150],"tradeoffs":[151],"accuracy,":[154],"reducing":[155],"fraction":[159],"makes":[160],"our":[161],"solution":[162],"viable":[164],"option":[165],"practical":[167],"applications.":[168]},"counts_by_year":[],"updated_date":"2026-07-02T09:51:11.867554","created_date":"2026-02-25T00:00:00"}
