{"id":"https://openalex.org/W4386597127","doi":"https://doi.org/10.1109/icip49359.2023.10222313","title":"Sandwiched Video Compression: Efficiently Extending the Reach of Standard Codecs with Neural Wrappers","display_name":"Sandwiched Video Compression: Efficiently Extending the Reach of Standard Codecs with Neural Wrappers","publication_year":2023,"publication_date":"2023-09-11","ids":{"openalex":"https://openalex.org/W4386597127","doi":"https://doi.org/10.1109/icip49359.2023.10222313"},"language":"en","primary_location":{"id":"doi:10.1109/icip49359.2023.10222313","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip49359.2023.10222313","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078939688","display_name":"Berivan Isik","orcid":"https://orcid.org/0000-0002-4926-5443"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Berivan Isik","raw_affiliation_strings":["Stanford University"],"affiliations":[{"raw_affiliation_string":"Stanford University","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028089028","display_name":"Onur G. Guleryuz","orcid":"https://orcid.org/0009-0007-8637-7181"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Onur G. Guleryuz","raw_affiliation_strings":["Google Research"],"affiliations":[{"raw_affiliation_string":"Google Research","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052922425","display_name":"Danhang Tang","orcid":"https://orcid.org/0000-0001-6164-8263"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Danhang Tang","raw_affiliation_strings":["Google Research"],"affiliations":[{"raw_affiliation_string":"Google Research","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036194594","display_name":"Jonathan Taylor","orcid":"https://orcid.org/0000-0002-2120-186X"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jonathan Taylor","raw_affiliation_strings":["Google Research"],"affiliations":[{"raw_affiliation_string":"Google Research","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019574907","display_name":"Philip A. Chou","orcid":"https://orcid.org/0000-0002-7242-0210"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Philip A. Chou","raw_affiliation_strings":["Google Research"],"affiliations":[{"raw_affiliation_string":"Google Research","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5078939688"],"corresponding_institution_ids":["https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":0.7379,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.72992856,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"2055","last_page":"2059"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/codec","display_name":"Codec","score":0.9053718447685242},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8426352739334106},{"id":"https://openalex.org/keywords/motion-compensation","display_name":"Motion compensation","score":0.6582669019699097},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.594364583492279},{"id":"https://openalex.org/keywords/video-compression-picture-types","display_name":"Video compression picture types","score":0.4800582826137543},{"id":"https://openalex.org/keywords/quarter-pixel-motion","display_name":"Quarter-pixel motion","score":0.45891129970550537},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3703870475292206},{"id":"https://openalex.org/keywords/video-processing","display_name":"Video processing","score":0.35517382621765137},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.343586266040802},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.32708075642585754},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.2481881082057953},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.12741374969482422}],"concepts":[{"id":"https://openalex.org/C161765866","wikidata":"https://www.wikidata.org/wiki/Q184748","display_name":"Codec","level":2,"score":0.9053718447685242},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8426352739334106},{"id":"https://openalex.org/C128840427","wikidata":"https://www.wikidata.org/wiki/Q1302174","display_name":"Motion compensation","level":2,"score":0.6582669019699097},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.594364583492279},{"id":"https://openalex.org/C106030495","wikidata":"https://www.wikidata.org/wiki/Q1797012","display_name":"Video compression picture types","level":4,"score":0.4800582826137543},{"id":"https://openalex.org/C174493125","wikidata":"https://www.wikidata.org/wiki/Q1073461","display_name":"Quarter-pixel motion","level":3,"score":0.45891129970550537},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3703870475292206},{"id":"https://openalex.org/C65483669","wikidata":"https://www.wikidata.org/wiki/Q3536669","display_name":"Video processing","level":2,"score":0.35517382621765137},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.343586266040802},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.32708075642585754},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.2481881082057953},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.12741374969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icip49359.2023.10222313","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip49359.2023.10222313","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W1966156115","https://openalex.org/W1980275325","https://openalex.org/W2024066070","https://openalex.org/W2146395539","https://openalex.org/W2490784316","https://openalex.org/W2505609860","https://openalex.org/W2785562966","https://openalex.org/W2948562596","https://openalex.org/W2962785568","https://openalex.org/W2963149687","https://openalex.org/W2964098744","https://openalex.org/W2969260367","https://openalex.org/W2984671549","https://openalex.org/W2999940418","https://openalex.org/W3035195755","https://openalex.org/W3095497211","https://openalex.org/W3116240515","https://openalex.org/W3120676420","https://openalex.org/W3134368609","https://openalex.org/W3134748538","https://openalex.org/W3140899032","https://openalex.org/W3173272744","https://openalex.org/W3183391581","https://openalex.org/W3214878703","https://openalex.org/W4214743248","https://openalex.org/W4317600270","https://openalex.org/W4317600317","https://openalex.org/W6763117472","https://openalex.org/W6784418059"],"related_works":["https://openalex.org/W2187171999","https://openalex.org/W2084338435","https://openalex.org/W4233771325","https://openalex.org/W4392666742","https://openalex.org/W3020968992","https://openalex.org/W1524157000","https://openalex.org/W4386870095","https://openalex.org/W1491752883","https://openalex.org/W2051615313","https://openalex.org/W1889918572"],"abstract_inverted_index":{"We":[0,88],"propose":[1,89],"sandwiched":[2],"video":[3,7,17,32,73,94,130],"compression":[4,8,59,105],"\u2013":[5],"a":[6,15,24,30,43,67],"system":[9,136],"that":[10,171],"wraps":[11],"neural":[12,25,112],"networks":[13,37,180],"around":[14],"standard":[16,31,55,72,109,142],"codec.":[18],"The":[19,36],"sandwich":[20,116,135],"framework":[21],"consists":[22],"of":[23,50,114],"pre-":[26,172],"and":[27,85,97,173],"post-processor":[28],"with":[29,47,79],"codec":[33,56,95],"between":[34],"them.":[35],"are":[38],"trained":[39],"jointly":[40],"to":[41,92,102,118],"optimize":[42],"rate-distortion":[44,121],"loss":[45],"function":[46],"the":[48,54,71,108,111,115,134,147,160],"goal":[49],"significantly":[51,119],"improving":[52],"over":[53,107,141,163],"in":[57,63,100,123,157],"various":[58],"scenarios.":[60,126],"End-to-end":[61],"training":[62],"this":[64],"setting":[65],"requires":[66],"differentiable":[68,90],"proxy":[69],"for":[70],"codec,":[74,110],"which":[75],"incorporates":[76],"temporal":[77],"processing":[78],"motion":[80],"compensation,":[81],"inter/intra":[82],"mode":[83],"decisions,":[84],"in-loop":[86],"filtering.":[87],"approximations":[91],"key":[93],"components":[96],"demonstrate":[98],"that,":[99],"addition":[101],"providing":[103],"meaningful":[104],"improvements":[106,140,156],"codes":[113],"lead":[117],"better":[120],"performance":[122],"two":[124],"important":[125],"When":[127],"transporting":[128],"high-resolution":[129],"via":[131],"low-resolution":[132],"HEVC,":[133],"obtains":[137],"6.5":[138],"dB":[139],"HEVC.":[143,164],"More":[144],"importantly,":[145],"using":[146],"well-known":[148],"perceptual":[149],"similarity":[150],"metric,":[151],"LPIPS,":[152],"we":[153,169],"observe":[154],"30%":[155],"rate":[158],"at":[159],"same":[161],"quality":[162],"Last":[165],"but":[166],"not":[167],"least,":[168],"show":[170],"post-processors":[174],"formed":[175],"by":[176],"very":[177],"modestly-parameterized,":[178],"light-weight":[179],"can":[181],"closely":[182],"approximate":[183],"these":[184],"results.":[185]},"counts_by_year":[{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
