{"id":"https://openalex.org/W3203188499","doi":"https://doi.org/10.1109/tip.2022.3231082","title":"Self-Supervised Learning of Perceptually Optimized Block Motion Estimates for Video Compression","display_name":"Self-Supervised Learning of Perceptually Optimized Block Motion Estimates for Video Compression","publication_year":2022,"publication_date":"2022-12-27","ids":{"openalex":"https://openalex.org/W3203188499","doi":"https://doi.org/10.1109/tip.2022.3231082","mag":"3203188499","pmid":"https://pubmed.ncbi.nlm.nih.gov/37015500"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2022.3231082","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2022.3231082","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031583853","display_name":"Somdyuti Paul","orcid":"https://orcid.org/0000-0002-2762-7263"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Somdyuti Paul","raw_affiliation_strings":["Department of Electrical and Computer Engineering, The University of Texas at Austin, Austin, TX, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, The University of Texas at Austin, Austin, TX, USA","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056447210","display_name":"Andrey Norkin","orcid":"https://orcid.org/0000-0002-2417-1635"},"institutions":[{"id":"https://openalex.org/I869089601","display_name":"Netflix (United States)","ror":"https://ror.org/0197qw696","country_code":"US","type":"company","lineage":["https://openalex.org/I869089601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrey Norkin","raw_affiliation_strings":["Netflix, Inc, Los Gatos, CA, USA"],"affiliations":[{"raw_affiliation_string":"Netflix, Inc, Los Gatos, CA, USA","institution_ids":["https://openalex.org/I869089601"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075463806","display_name":"Alan C. Bovik","orcid":"https://orcid.org/0000-0001-6067-710X"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alan C. Bovik","raw_affiliation_strings":["Department of Electrical and Computer Engineering, The University of Texas at Austin, Austin, TX, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, The University of Texas at Austin, Austin, TX, USA","institution_ids":["https://openalex.org/I86519309"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5031583853"],"corresponding_institution_ids":["https://openalex.org/I86519309"],"apc_list":null,"apc_paid":null,"fwci":0.5094,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.61794684,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"32","issue":null,"first_page":"617","last_page":"630"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.6905855536460876},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6761673092842102},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6692404747009277},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5997568964958191},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.5389654636383057},{"id":"https://openalex.org/keywords/motion-estimation","display_name":"Motion estimation","score":0.49621230363845825},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.4730460047721863},{"id":"https://openalex.org/keywords/motion-compensation","display_name":"Motion compensation","score":0.43024274706840515},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.4257514178752899},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4178074896335602},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.24564692378044128}],"concepts":[{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.6905855536460876},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6761673092842102},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6692404747009277},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5997568964958191},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.5389654636383057},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.49621230363845825},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.4730460047721863},{"id":"https://openalex.org/C128840427","wikidata":"https://www.wikidata.org/wiki/Q1302174","display_name":"Motion compensation","level":2,"score":0.43024274706840515},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.4257514178752899},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4178074896335602},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.24564692378044128},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2022.3231082","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2022.3231082","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:37015500","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37015500","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https://openalex.org/W603908379","https://openalex.org/W764651262","https://openalex.org/W1522301498","https://openalex.org/W1580389772","https://openalex.org/W1973207880","https://openalex.org/W1978479866","https://openalex.org/W2004185490","https://openalex.org/W2019612949","https://openalex.org/W2064428286","https://openalex.org/W2097787789","https://openalex.org/W2101700394","https://openalex.org/W2123950557","https://openalex.org/W2133665775","https://openalex.org/W2145251738","https://openalex.org/W2147253850","https://openalex.org/W2276329208","https://openalex.org/W2507953016","https://openalex.org/W2548527721","https://openalex.org/W2596816328","https://openalex.org/W2620258460","https://openalex.org/W2751105188","https://openalex.org/W2761287863","https://openalex.org/W2791561215","https://openalex.org/W2792448276","https://openalex.org/W2793408333","https://openalex.org/W2802358283","https://openalex.org/W2802934755","https://openalex.org/W2891639355","https://openalex.org/W2896754546","https://openalex.org/W2901921200","https://openalex.org/W2913664580","https://openalex.org/W2963782415","https://openalex.org/W2963891416","https://openalex.org/W2969260367","https://openalex.org/W2972765469","https://openalex.org/W2980441643","https://openalex.org/W2984671549","https://openalex.org/W2992051623","https://openalex.org/W3008317530","https://openalex.org/W3010458743","https://openalex.org/W3026315686","https://openalex.org/W3031546776","https://openalex.org/W3045512288","https://openalex.org/W3080277927","https://openalex.org/W3089562308","https://openalex.org/W3100456687","https://openalex.org/W3101531460","https://openalex.org/W3103682398","https://openalex.org/W3131833214","https://openalex.org/W3155750884","https://openalex.org/W4205891041","https://openalex.org/W4303074198","https://openalex.org/W6618372016","https://openalex.org/W6631190155","https://openalex.org/W6738461048"],"related_works":["https://openalex.org/W1579157894","https://openalex.org/W1967654336","https://openalex.org/W2060632806","https://openalex.org/W1530267862","https://openalex.org/W2995690499","https://openalex.org/W1494405360","https://openalex.org/W2050955821","https://openalex.org/W2153529351","https://openalex.org/W2040149295","https://openalex.org/W2016848112"],"abstract_inverted_index":{"Block":[0],"based":[1,18,185,241],"motion":[2,26,73,89,96,110,165,186,242],"estimation":[3,97,111,187,243],"is":[4,50,106,130],"integral":[5],"to":[6,23,44,108,158,181,196,223,237],"inter":[7,198],"prediction":[8,191,199],"processes":[9],"performed":[10],"in":[11,58,132,200,211,246],"hybrid":[12],"video":[13,147],"codecs.":[14],"Prevalent":[15],"block":[16,25,48,54,95,114,126,183,239],"matching":[17,55,184,240],"methods":[19],"that":[20,76,140],"are":[21,77],"used":[22,57,195],"compute":[24],"vectors":[27],"(MVs)":[28],"rely":[29],"on":[30,112,136],"computationally":[31],"intensive":[32],"search":[33],"procedures.":[34],"They":[35],"also":[36],"suffer":[37],"from":[38,143],"the":[39,47,53,65,72,83,151,160,164,173,202,206,224,238,247],"aperture":[40],"problem,":[41],"which":[42,105],"tends":[43],"worsen":[45],"as":[46,122,235],"size":[49],"reduced.":[51],"Moreover,":[52],"criteria":[56],"typical":[59],"codecs":[60],"do":[61],"not":[62],"account":[63],"for":[64,189],"resulting":[66],"levels":[67],"of":[68,71,86,120,163,176,205,217],"perceptual":[69,161],"quality":[70,162,232],"compensated":[74,166],"pictures":[75],"created":[78,142],"upon":[79],"decoding.":[80],"Towards":[81],"achieving":[82],"elusive":[84],"goal":[85],"perceptually":[87,207],"optimized":[88,208],"estimation,":[90],"we":[91,141],"propose":[92],"a":[93,100,118,133,137],"search-free":[94],"framework":[98],"using":[99,117],"multi-stage":[101],"convolutional":[102],"neural":[103],"network,":[104],"able":[107],"conduct":[109],"multiple":[113],"sizes":[115],"simultaneously,":[116],"triplet":[119],"frames":[121],"input.":[123],"This":[124],"composite":[125],"translation":[127],"network":[128],"(CBT-Net)":[129],"trained":[131],"self-supervised":[134],"manner":[135],"large":[138],"database":[139],"publicly":[144],"available":[145],"uncompressed":[146],"content.":[148],"We":[149],"deploy":[150],"multi-scale":[152],"structural":[153],"similarity":[154],"(MS-SSIM)":[155],"loss":[156],"function":[157],"optimize":[159],"predicted":[167],"frames.":[168],"Our":[169],"experimental":[170],"results":[171],"highlight":[172],"computational":[174],"efficiency":[175],"our":[177],"proposed":[178],"model":[179,209],"relative":[180],"conventional":[182],"algorithms,":[188],"comparable":[190],"errors.":[192],"Further,":[193],"when":[194],"perform":[197],"AV1,":[201],"MV":[203],"predictions":[204],"result":[210],"average":[212],"Bj\u00f8ntegaard-delta":[213],"rate":[214],"(BD-rate)":[215],"improvements":[216],"-1.73%":[218],"and":[219,226],"-1.31%":[220],"with":[221],"respect":[222],"MS-SSIM":[225],"Video":[227],"Multi-Method":[228],"Assessment":[229],"Fusion":[230],"(VMAF)":[231],"metrics,":[233],"respectively,":[234],"compared":[236],"system":[244],"employed":[245],"SVT-AV1":[248],"encoder.":[249]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
