{"id":"https://openalex.org/W4406860217","doi":"https://doi.org/10.1109/vcip63160.2024.10849929","title":"Deep Reference Frame for Versatile Video Coding with Structural Re-parameterization","display_name":"Deep Reference Frame for Versatile Video Coding with Structural Re-parameterization","publication_year":2024,"publication_date":"2024-12-08","ids":{"openalex":"https://openalex.org/W4406860217","doi":"https://doi.org/10.1109/vcip63160.2024.10849929"},"language":"en","primary_location":{"id":"doi:10.1109/vcip63160.2024.10849929","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip63160.2024.10849929","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113144993","display_name":"C. Gui","orcid":"https://orcid.org/0009-0004-1423-4630"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chengzhuo Gui","raw_affiliation_strings":["Wuhan University,Hubei Luojia Laboratory,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,Hubei Luojia Laboratory,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049991780","display_name":"Yuantong Zhang","orcid":"https://orcid.org/0000-0002-1473-940X"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuantong Zhang","raw_affiliation_strings":["Wuhan University,School of Remote Sensing and Information Engineering,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Remote Sensing and Information Engineering,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020651536","display_name":"Weijie Bao","orcid":"https://orcid.org/0000-0002-9039-1257"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weijie Bao","raw_affiliation_strings":["Wuhan University,School of Remote Sensing and Information Engineering,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Remote Sensing and Information Engineering,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006748765","display_name":"Zhenzhong Chen","orcid":"https://orcid.org/0000-0002-7882-1066"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenzhong Chen","raw_affiliation_strings":["Wuhan University,School of Remote Sensing and Information Engineering,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,School of Remote Sensing and Information Engineering,Wuhan,China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050242390","display_name":"Huairui Wang","orcid":"https://orcid.org/0009-0004-2870-6117"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huairui Wang","raw_affiliation_strings":["Tencent,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Tencent,Shenzhen,China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100449791","display_name":"Shan Liu","orcid":"https://orcid.org/0000-0003-1847-8769"},"institutions":[{"id":"https://openalex.org/I70745867","display_name":"KLA (United States)","ror":"https://ror.org/02rqhpa98","country_code":"US","type":"company","lineage":["https://openalex.org/I70745867"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shan Liu","raw_affiliation_strings":["Tencent America,Palo Alto,CA,USA"],"affiliations":[{"raw_affiliation_string":"Tencent America,Palo Alto,CA,USA","institution_ids":["https://openalex.org/I70745867"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5113144993"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":null,"apc_paid":null,"fwci":0.3735,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.62461851,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10741","display_name":"Video Coding and Compression Technologies","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10741","display_name":"Video Coding and Compression Technologies","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13579","display_name":"Image and Video Stabilization","score":0.9894000291824341,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7302201986312866},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.583490788936615},{"id":"https://openalex.org/keywords/reference-frame","display_name":"Reference frame","score":0.5185935497283936},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.4775579571723938},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35226577520370483},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3209896683692932},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.17119723558425903},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08436417579650879}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7302201986312866},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.583490788936615},{"id":"https://openalex.org/C172849965","wikidata":"https://www.wikidata.org/wiki/Q3148875","display_name":"Reference frame","level":3,"score":0.5185935497283936},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.4775579571723938},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35226577520370483},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3209896683692932},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.17119723558425903},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08436417579650879},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/vcip63160.2024.10849929","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip63160.2024.10849929","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W2769654144","https://openalex.org/W2896406755","https://openalex.org/W2943766642","https://openalex.org/W2963109922","https://openalex.org/W2963189365","https://openalex.org/W2967151712","https://openalex.org/W2982083293","https://openalex.org/W2998645105","https://openalex.org/W3013052828","https://openalex.org/W3085258535","https://openalex.org/W3135530072","https://openalex.org/W3167976421","https://openalex.org/W3171038842","https://openalex.org/W3188610266","https://openalex.org/W4293363567","https://openalex.org/W4304080653","https://openalex.org/W4312770027","https://openalex.org/W4318617422","https://openalex.org/W4385453475","https://openalex.org/W4391306830","https://openalex.org/W6737664043","https://openalex.org/W6749781174","https://openalex.org/W6870133103"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"In":[0,47],"video":[1],"coding,":[2],"inter-prediction":[3],"leverages":[4],"neigh-boring":[5],"frames":[6,16],"to":[7,30,71,115,145],"reduce":[8],"temporal":[9],"redundancy.":[10],"The":[11],"quality":[12,33],"of":[13,34],"these":[14],"reference":[15,35,67],"is":[17,38],"essential":[18],"for":[19,41,59,136],"effective":[20,94],"inter-prediction.":[21],"Although":[22],"many":[23],"neural":[24],"network-based":[25],"methods":[26],"have":[27],"been":[28],"proposed":[29],"improve":[31,72],"the":[32,42],"frames,":[36],"there":[37],"still":[39],"room":[40],"performance":[43,73,100,121],"and":[44,77,99,122],"efficiency":[45,134],"trade-off.":[46],"this":[48],"paper,":[49],"we":[50,81,103],"propose":[51,82,104],"an":[52],"interpolation":[53,62,69],"diverse":[54],"branch":[55],"block":[56,87],"(InterDBB)":[57],"suitable":[58],"lightweight":[60],"frame":[61,68],"networks,":[63],"which":[64],"optimizes":[65],"deep":[66],"networks":[70],"without":[74,88],"sacrificing":[75],"speed":[76],"increasing":[78],"complexity.":[79,124],"Specifically,":[80],"a":[83,105,117],"multi-branch":[84],"structural":[85],"reparameterization":[86],"batch":[89],"normalization.":[90],"This":[91],"straightforward":[92],"yet":[93],"modification":[95],"ensures":[96],"training":[97],"stability":[98],"improvement.":[101],"Moreover,":[102],"parameterized":[106],"motion":[107],"estimation":[108],"strategy":[109],"based":[110],"on":[111],"different":[112],"input":[113],"resolution,":[114],"achieve":[116],"better":[118],"trade-off":[119],"between":[120],"computational":[123],"Experimental":[125],"results":[126],"demonstrate":[127],"that":[128],"our":[129],"method":[130],"achieves":[131],"-2.01%/-2.87%/-2.44%":[132],"coding":[133],"improvements":[135],"Y/U/V":[137],"components":[138],"under":[139],"random":[140],"access":[141],"(RA)":[142],"configuration":[143],"compared":[144],"VTM-11.0_NNVC-5.0.":[146]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
