{"id":"https://openalex.org/W3113596896","doi":"https://doi.org/10.1109/mmsp48831.2020.9287114","title":"VMAF Based Rate-Distortion Optimization for Video Coding","display_name":"VMAF Based Rate-Distortion Optimization for Video Coding","publication_year":2020,"publication_date":"2020-09-21","ids":{"openalex":"https://openalex.org/W3113596896","doi":"https://doi.org/10.1109/mmsp48831.2020.9287114","mag":"3113596896"},"language":"en","primary_location":{"id":"doi:10.1109/mmsp48831.2020.9287114","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mmsp48831.2020.9287114","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE 22nd International Workshop on Multimedia Signal Processing (MMSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080104324","display_name":"Sai Deng","orcid":"https://orcid.org/0000-0002-3681-4888"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sai Deng","raw_affiliation_strings":["WebM Codec Team, Google LLC, Mountain View, CA"],"affiliations":[{"raw_affiliation_string":"WebM Codec Team, Google LLC, Mountain View, CA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046233912","display_name":"Jingning Han","orcid":"https://orcid.org/0000-0001-7168-2254"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jingning Han","raw_affiliation_strings":["WebM Codec Team, Google LLC, Mountain View, CA"],"affiliations":[{"raw_affiliation_string":"WebM Codec Team, Google LLC, Mountain View, CA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103766279","display_name":"Yaowu Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yaowu Xu","raw_affiliation_strings":["WebM Codec Team, Google LLC, Mountain View, CA"],"affiliations":[{"raw_affiliation_string":"WebM Codec Team, Google LLC, Mountain View, CA","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5080104324"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":1.3678,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.84005512,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rate\u2013distortion-optimization","display_name":"Rate\u2013distortion optimization","score":0.8065069913864136},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7422100901603699},{"id":"https://openalex.org/keywords/peak-signal-to-noise-ratio","display_name":"Peak signal-to-noise ratio","score":0.6176198124885559},{"id":"https://openalex.org/keywords/video-quality","display_name":"Video quality","score":0.6107087731361389},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5958722233772278},{"id":"https://openalex.org/keywords/codec","display_name":"Codec","score":0.5897292494773865},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5590354204177856},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.5227765440940857},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4393061399459839},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.41063442826271057},{"id":"https://openalex.org/keywords/multiview-video-coding","display_name":"Multiview Video Coding","score":0.366535484790802},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3630799353122711},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.3490552306175232},{"id":"https://openalex.org/keywords/video-processing","display_name":"Video processing","score":0.3120892643928528},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18032661080360413},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.09520503878593445},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.09295693039894104},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.09029009938240051}],"concepts":[{"id":"https://openalex.org/C50056821","wikidata":"https://www.wikidata.org/wiki/Q774502","display_name":"Rate\u2013distortion optimization","level":5,"score":0.8065069913864136},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7422100901603699},{"id":"https://openalex.org/C154579607","wikidata":"https://www.wikidata.org/wiki/Q3373850","display_name":"Peak signal-to-noise ratio","level":3,"score":0.6176198124885559},{"id":"https://openalex.org/C103910844","wikidata":"https://www.wikidata.org/wiki/Q2631256","display_name":"Video quality","level":3,"score":0.6107087731361389},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5958722233772278},{"id":"https://openalex.org/C161765866","wikidata":"https://www.wikidata.org/wiki/Q184748","display_name":"Codec","level":2,"score":0.5897292494773865},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5590354204177856},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.5227765440940857},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4393061399459839},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.41063442826271057},{"id":"https://openalex.org/C23431618","wikidata":"https://www.wikidata.org/wiki/Q1404672","display_name":"Multiview Video Coding","level":4,"score":0.366535484790802},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3630799353122711},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.3490552306175232},{"id":"https://openalex.org/C65483669","wikidata":"https://www.wikidata.org/wiki/Q3536669","display_name":"Video processing","level":2,"score":0.3120892643928528},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18032661080360413},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.09520503878593445},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.09295693039894104},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.09029009938240051},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mmsp48831.2020.9287114","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mmsp48831.2020.9287114","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE 22nd International Workshop on Multimedia Signal Processing (MMSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W1984288074","https://openalex.org/W2046119925","https://openalex.org/W2117804578","https://openalex.org/W2169161136","https://openalex.org/W2891639355","https://openalex.org/W2943811461","https://openalex.org/W2970590196","https://openalex.org/W2989752519","https://openalex.org/W6767729413"],"related_works":["https://openalex.org/W2045735464","https://openalex.org/W2104624537","https://openalex.org/W2099031831","https://openalex.org/W1982720242","https://openalex.org/W4388134597","https://openalex.org/W2113471818","https://openalex.org/W101275777","https://openalex.org/W4389390133","https://openalex.org/W2123694428","https://openalex.org/W4361854065"],"abstract_inverted_index":{"Video":[0],"Multi-method":[1],"Assessment":[2],"Fusion":[3],"(VMAF)":[4],"is":[5,13,71],"a":[6,59,77,81,88],"machine-learning":[7],"based":[8],"video":[9,65,112],"quality":[10],"metric.":[11,96],"It":[12,70],"experimentally":[14],"shown":[15],"to":[16,26,51,62,110],"provide":[17],"higher":[18],"correlation":[19],"with":[20,80],"human":[21],"visual":[22],"system":[23],"as":[24,47,108],"compared":[25,109],"conventional":[27,111],"metrics":[28],"like":[29],"peak":[30],"signal-to-noise":[31],"ratio":[32],"(PSNR)":[33],"and":[34,42,87],"structural":[35],"similarity":[36],"index":[37],"(SSIM)":[38],"in":[39,68,106],"many":[40],"scenarios":[41],"has":[43],"drawn":[44],"considerable":[45],"interest":[46],"an":[48],"alternative":[49],"metric":[50],"evaluate":[52],"the":[53,64],"perceptual":[54],"quality.":[55],"This":[56],"work":[57],"proposes":[58],"systematic":[60],"approach":[61],"improve":[63],"compression":[66],"performance":[67],"VMAF.":[69],"composed":[72],"of":[73],"multiple":[74],"components":[75],"including":[76],"pre-processing":[78],"stage":[79],"complement":[82],"automatic":[83],"filter":[84],"parameter":[85],"selection,":[86],"modified":[89],"rate-distortion":[90],"optimization":[91],"framework":[92],"tailored":[93],"for":[94,115],"VMAF":[95],"The":[97],"proposed":[98],"scheme":[99],"achieves":[100],"on":[101],"average":[102],"37%":[103],"BD-rate":[104],"reduction":[105],"VMAF,":[107],"codec":[113],"optimized":[114],"PSNR.":[116]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
