{"id":"https://openalex.org/W4387490618","doi":"https://doi.org/10.1109/tcsvt.2023.3323483","title":"Joint Pixel and Frequency Feature Learning and Fusion via Channel-Wise Transformer for High-Efficiency Learned In-Loop Filter in VVC","display_name":"Joint Pixel and Frequency Feature Learning and Fusion via Channel-Wise Transformer for High-Efficiency Learned In-Loop Filter in VVC","publication_year":2023,"publication_date":"2023-10-10","ids":{"openalex":"https://openalex.org/W4387490618","doi":"https://doi.org/10.1109/tcsvt.2023.3323483"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2023.3323483","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3323483","pdf_url":"https://ieeexplore.ieee.org/ielx7/76/4358651/10275101.pdf","source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://ieeexplore.ieee.org/ielx7/76/4358651/10275101.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036691509","display_name":"Birendra Kathariya","orcid":"https://orcid.org/0000-0001-9297-8978"},"institutions":[{"id":"https://openalex.org/I75421653","display_name":"University of Missouri\u2013Kansas City","ror":"https://ror.org/01w0d5g70","country_code":"US","type":"education","lineage":["https://openalex.org/I75421653"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Birendra Kathariya","raw_affiliation_strings":["Department of Computer Science and Electrical Engineering, University of Missouri-Kansas City, Kansas City, MO, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Electrical Engineering, University of Missouri-Kansas City, Kansas City, MO, USA","institution_ids":["https://openalex.org/I75421653"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100380625","display_name":"Zhu Li","orcid":"https://orcid.org/0000-0002-8246-177X"},"institutions":[{"id":"https://openalex.org/I75421653","display_name":"University of Missouri\u2013Kansas City","ror":"https://ror.org/01w0d5g70","country_code":"US","type":"education","lineage":["https://openalex.org/I75421653"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhu Li","raw_affiliation_strings":["Department of Computer Science and Electrical Engineering, University of Missouri-Kansas City, Kansas City, MO, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Electrical Engineering, University of Missouri-Kansas City, Kansas City, MO, USA","institution_ids":["https://openalex.org/I75421653"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083485280","display_name":"Geert Van der Auwera","orcid":"https://orcid.org/0000-0001-7791-4829"},"institutions":[{"id":"https://openalex.org/I4210087596","display_name":"Qualcomm (United States)","ror":"https://ror.org/002zrf773","country_code":"US","type":"company","lineage":["https://openalex.org/I4210087596"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Geert Van der Auwera","raw_affiliation_strings":["Qualcomm Technologies Inc, San Diego, CA, USA"],"affiliations":[{"raw_affiliation_string":"Qualcomm Technologies Inc, San Diego, CA, USA","institution_ids":["https://openalex.org/I4210087596"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5036691509"],"corresponding_institution_ids":["https://openalex.org/I75421653"],"apc_list":null,"apc_paid":null,"fwci":2.4072,"has_fulltext":true,"cited_by_count":20,"citation_normalized_percentile":{"value":0.90910399,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"34","issue":"5","first_page":"4070","last_page":"4083"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7715117931365967},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5634316802024841},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5483397841453552},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.5343543291091919},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4844262897968292},{"id":"https://openalex.org/keywords/codec","display_name":"Codec","score":0.45968884229660034},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.45747897028923035},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4106272757053375},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36261802911758423},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.32227784395217896},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.13156616687774658},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09623542428016663}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7715117931365967},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5634316802024841},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5483397841453552},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.5343543291091919},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4844262897968292},{"id":"https://openalex.org/C161765866","wikidata":"https://www.wikidata.org/wiki/Q184748","display_name":"Codec","level":2,"score":0.45968884229660034},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.45747897028923035},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4106272757053375},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36261802911758423},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.32227784395217896},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.13156616687774658},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09623542428016663},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2023.3323483","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3323483","pdf_url":"https://ieeexplore.ieee.org/ielx7/76/4358651/10275101.pdf","source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1109/tcsvt.2023.3323483","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3323483","pdf_url":"https://ieeexplore.ieee.org/ielx7/76/4358651/10275101.pdf","source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8432471258","display_name":null,"funder_award_id":"2148382","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320308258","display_name":"Qualcomm","ror":"https://ror.org/002zrf773"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387490618.pdf","grobid_xml":"https://content.openalex.org/works/W4387490618.grobid-xml"},"referenced_works_count":58,"referenced_works":["https://openalex.org/W1885185971","https://openalex.org/W2017801928","https://openalex.org/W2064674198","https://openalex.org/W2097117768","https://openalex.org/W2123113293","https://openalex.org/W2146395539","https://openalex.org/W2147000487","https://openalex.org/W2194775991","https://openalex.org/W2477177239","https://openalex.org/W2519021537","https://openalex.org/W2552465432","https://openalex.org/W2604272474","https://openalex.org/W2892020820","https://openalex.org/W2915130236","https://openalex.org/W2942071819","https://openalex.org/W2963343778","https://openalex.org/W2963372104","https://openalex.org/W2963446712","https://openalex.org/W2963494934","https://openalex.org/W2964077901","https://openalex.org/W2965217508","https://openalex.org/W2966431607","https://openalex.org/W2968397583","https://openalex.org/W2969260367","https://openalex.org/W2970872821","https://openalex.org/W2985577924","https://openalex.org/W2999132674","https://openalex.org/W3000775737","https://openalex.org/W3034782636","https://openalex.org/W3038753503","https://openalex.org/W3043029414","https://openalex.org/W3080437795","https://openalex.org/W3081342944","https://openalex.org/W3090654092","https://openalex.org/W3104949790","https://openalex.org/W3153323090","https://openalex.org/W3164064764","https://openalex.org/W3166014221","https://openalex.org/W3169596802","https://openalex.org/W3172995745","https://openalex.org/W3189180948","https://openalex.org/W3202040256","https://openalex.org/W3202918664","https://openalex.org/W3207918547","https://openalex.org/W4220715488","https://openalex.org/W4224130636","https://openalex.org/W4224294196","https://openalex.org/W4287020683","https://openalex.org/W4292829111","https://openalex.org/W4312396555","https://openalex.org/W4312812783","https://openalex.org/W4316660221","https://openalex.org/W4317555198","https://openalex.org/W4367146862","https://openalex.org/W6684191040","https://openalex.org/W6725739302","https://openalex.org/W6766847852","https://openalex.org/W6799637880"],"related_works":["https://openalex.org/W2964213236","https://openalex.org/W2163719598","https://openalex.org/W3161919736","https://openalex.org/W2387018512","https://openalex.org/W2107680156","https://openalex.org/W4301184752","https://openalex.org/W2288771647","https://openalex.org/W2751422192","https://openalex.org/W2008888243","https://openalex.org/W4309346246"],"abstract_inverted_index":{"Block-based":[0],"video":[1,78],"codecs":[2,25],"such":[3],"as":[4,49,238,240],"Versatile":[5],"Video":[6,11,15],"Coding":[7,12,16],"(VVC)/H.266,":[8],"High":[9],"Efficiency":[10],"(HEVC)/H.265,":[13],"Advanced":[14],"(AVC)/H.264":[17],"etc.":[18],"inherently":[19],"introduces":[20,167],"compression":[21],"artifacts.":[22],"Although":[23],"these":[24,31,140],"have":[26],"in-loop":[27,54],"filters":[28],"to":[29,39,91,142,181,206],"correct":[30],"distortions,":[32],"they":[33,95],"are":[34],"not":[35],"always":[36],"effective":[37],"due":[38],"the":[40,43,59,71,76,123,173,178,191,209,218,226],"complexity":[41],"of":[42,58,133,177,204],"noise.":[44],"Recently,":[45],"deep-learning":[46],"approaches":[47,61,150],"emerged":[48],"a":[50,85,110,134,153,168,197,245],"promising":[51],"solution":[52],"for":[53,65,208],"filtering.":[55],"However,":[56,94],"most":[57],"previous":[60,82,149],"were":[62],"designed":[63],"solely":[64],"learning":[66],"from":[67,121,148],"images":[68],"and":[69,88,126,129,221],"neglected":[70],"high-frequency":[72],"signals":[73],"present":[74],"in":[75,172],"reconstructed":[77],"frames.":[79],"Furthermore,":[80],"some":[81],"methods":[83],"employed":[84],"multi-level":[86],"feature-extraction":[87],"feature-fusion":[89,103,161],"strategy":[90],"enhance":[92],"performance.":[93,144],"utilized":[96],"complex":[97],"feature-extractors":[98],"while":[99],"relying":[100],"on":[101],"naive":[102],"methods.":[104,224],"In":[105],"this":[106],"article,":[107],"we":[108],"propose":[109],"novel":[111],"framework":[112],"called":[113],"<italic":[114,164,193,228,241],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[115,165,194,229,242],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">TSF-Net</i>":[116,166,195,230,243],",":[117],"which":[118],"jointly":[119],"learns":[120],"both":[122,139],"pixel":[124],"(spatial)":[125],"frequency-decomposed":[127],"information":[128,141],"through":[130],"powerful":[131],"capability":[132],"channel-wise":[135,179,234,247],"transformer,":[136],"it":[137,183],"fuses":[138],"improve":[143],"Our":[145,186],"approach":[146],"deviates":[147],"by":[151],"employing":[152],"simple":[154],"feature-extractor":[155],"coupled":[156],"with":[157,231,244],"an":[158,232],"advanced":[159],"transformer-based":[160],"module.":[162],"Simultaneously,":[163],"few":[169],"fundamental":[170],"modifications":[171],"multi-head":[174],"self-attention":[175],"module":[176],"transformer":[180,235],"make":[182],"computationally":[184],"efficient.":[185],"experimental":[187],"results":[188],"show":[189],"that":[190],"proposed":[192,227],"achieves":[196],"Bj\u00f8ntegaard":[198],"Delta":[199],"(BD)":[200],"-":[201],"bitrate":[202],"saving":[203],"up":[205],"10.258%":[207],"luma":[210],"(Y)":[211],"component":[212],"under":[213],"all-intra":[214],"(AI)":[215],"profile":[216],"outperforming":[217],"VVC":[219],"baseline":[220],"other":[222],"state-of-the-art":[223],"Moreover,":[225],"efficient":[233,239],"is":[236],"twice":[237],"vanilla":[246],"transformer.":[248]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":11}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
