{"id":"https://openalex.org/W4416799095","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11248974","title":"Accelerating VVC Inter-Frame Coding: A Lightweight CNN for Fast QTMT Partitioning","display_name":"Accelerating VVC Inter-Frame Coding: A Lightweight CNN for Fast QTMT Partitioning","publication_year":2025,"publication_date":"2025-10-22","ids":{"openalex":"https://openalex.org/W4416799095","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11248974"},"language":null,"primary_location":{"id":"doi:10.1109/apsipaasc65261.2025.11248974","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11248974","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Jui-Chen Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Jui-Chen Luo","raw_affiliation_strings":["National Taiwan University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"National Taiwan University of Science and Technology","institution_ids":["https://openalex.org/I154864474"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076112850","display_name":"Jiann\u2010Jone Chen","orcid":"https://orcid.org/0000-0002-3519-1594"},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Jiann-Jone Chen","raw_affiliation_strings":["National Taiwan University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"National Taiwan University of Science and Technology","institution_ids":["https://openalex.org/I154864474"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103177987","display_name":"Tien-Ying Kuo","orcid":"https://orcid.org/0000-0001-9831-5622"},"institutions":[{"id":"https://openalex.org/I118292597","display_name":"National Taipei University of Technology","ror":"https://ror.org/00cn92c09","country_code":"TW","type":"education","lineage":["https://openalex.org/I118292597"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Tien-Ying Kuo","raw_affiliation_strings":["National Taipei University of Technology"],"affiliations":[{"raw_affiliation_string":"National Taipei University of Technology","institution_ids":["https://openalex.org/I118292597"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101703487","display_name":"Yifan Wu","orcid":"https://orcid.org/0000-0002-3832-6618"},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yi-Fan Wu","raw_affiliation_strings":["National Taiwan University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"National Taiwan University of Science and Technology","institution_ids":["https://openalex.org/I154864474"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007665478","display_name":"K. Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I154864474","display_name":"National Taiwan University of Science and Technology","ror":"https://ror.org/00q09pe49","country_code":"TW","type":"education","lineage":["https://openalex.org/I154864474"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Kai-Jie Zhang","raw_affiliation_strings":["National Taiwan University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"National Taiwan University of Science and Technology","institution_ids":["https://openalex.org/I154864474"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I154864474"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.43840524,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2459","last_page":"2464"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10741","display_name":"Video Coding and Compression Technologies","score":0.982699990272522,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10741","display_name":"Video Coding and Compression Technologies","score":0.982699990272522,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.006500000134110451,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.0038999998942017555,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.6133000254631042},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.5956000089645386},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.5070000290870667},{"id":"https://openalex.org/keywords/context-adaptive-binary-arithmetic-coding","display_name":"Context-adaptive binary arithmetic coding","score":0.4596000015735626},{"id":"https://openalex.org/keywords/coding-tree-unit","display_name":"Coding tree unit","score":0.43860000371932983},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.4320000112056732},{"id":"https://openalex.org/keywords/algorithmic-efficiency","display_name":"Algorithmic efficiency","score":0.4311999976634979},{"id":"https://openalex.org/keywords/random-access","display_name":"Random access","score":0.4189000129699707},{"id":"https://openalex.org/keywords/bit-rate","display_name":"Bit rate","score":0.3903000056743622}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7519000172615051},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.6133000254631042},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.5956000089645386},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.5070000290870667},{"id":"https://openalex.org/C175732694","wikidata":"https://www.wikidata.org/wiki/Q1128713","display_name":"Context-adaptive binary arithmetic coding","level":3,"score":0.4596000015735626},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.4546000063419342},{"id":"https://openalex.org/C190750250","wikidata":"https://www.wikidata.org/wiki/Q13533439","display_name":"Coding tree unit","level":3,"score":0.43860000371932983},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.4320000112056732},{"id":"https://openalex.org/C116709606","wikidata":"https://www.wikidata.org/wiki/Q1296251","display_name":"Algorithmic efficiency","level":3,"score":0.4311999976634979},{"id":"https://openalex.org/C101722063","wikidata":"https://www.wikidata.org/wiki/Q218825","display_name":"Random access","level":2,"score":0.4189000129699707},{"id":"https://openalex.org/C2987812609","wikidata":"https://www.wikidata.org/wiki/Q194158","display_name":"Bit rate","level":2,"score":0.3903000056743622},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3901999890804291},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.364300012588501},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.36410000920295715},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.35910001397132874},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.3319000005722046},{"id":"https://openalex.org/C169805256","wikidata":"https://www.wikidata.org/wiki/Q1361381","display_name":"Transform coding","level":4,"score":0.32589998841285706},{"id":"https://openalex.org/C163797641","wikidata":"https://www.wikidata.org/wiki/Q2067937","display_name":"Tree structure","level":3,"score":0.3237999975681305},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.305400013923645},{"id":"https://openalex.org/C25797200","wikidata":"https://www.wikidata.org/wiki/Q828137","display_name":"Compression ratio","level":3,"score":0.28769999742507935},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.27320000529289246},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.2709999978542328},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.27059999108314514},{"id":"https://openalex.org/C151416825","wikidata":"https://www.wikidata.org/wiki/Q934791","display_name":"Quadtree","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C2221639","wikidata":"https://www.wikidata.org/wiki/Q2877","display_name":"Discrete cosine transform","level":3,"score":0.2623000144958496},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2599000036716461},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.25619998574256897}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipaasc65261.2025.11248974","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11248974","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2963163009","https://openalex.org/W3002658862","https://openalex.org/W3035784627","https://openalex.org/W3153617831","https://openalex.org/W3157739744","https://openalex.org/W3170633153","https://openalex.org/W3202918664","https://openalex.org/W4285035674","https://openalex.org/W4304465124","https://openalex.org/W4308210855","https://openalex.org/W4308235895","https://openalex.org/W4312097398","https://openalex.org/W4388240329"],"related_works":[],"abstract_inverted_index":{"The":[0],"H.266/Versatile":[1],"Video":[2],"Coding":[3],"(VVC)":[4],"standard":[5],"offers":[6],"<tex":[7,20,142,162],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[8,21,143,163],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathbf{3":[9,144],"0":[10,12,153],"\\%}-\\mathbf{5":[11],"\\%}$</tex>":[13,154],"higher":[14,45],"compression":[15],"efficiency":[16],"than":[17,80],"its":[18],"predecessor,":[19],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathbf{H.":[22],"2":[23,152],"6":[24,166],"5}":[25],"/":[26],"\\mathbf{H":[27],"E":[28],"V":[29],"C}$</tex>,":[30],"while":[31,123],"maintaining":[32,124],"comparable":[33],"visual":[34],"quality.":[35],"However,":[36],"this":[37,86],"improvement":[38],"comes":[39],"at":[40],"the":[41,132,181],"cost":[42],"of":[43,82],"substantially":[44],"computational":[46],"complexity,":[47,190],"posing":[48],"challenges":[49],"for":[50],"real-time":[51,195],"encoding.":[52],"In":[53],"particular,":[54],"VVC's":[55],"Quad-Tree":[56],"plus":[57],"Multi-type":[58],"Tree":[59],"(QTMT)":[60],"block":[61],"partitioning,":[62],"high-precision":[63],"motion":[64],"compensation,":[65],"and":[66,113,204],"multi-directional":[67],"prediction":[68,102],"contribute":[69],"to":[70,76,110],"encoding":[71,157,189],"times":[72,78],"that":[73,104,138,180],"are":[74],"8":[75],"10":[77],"longer":[79],"those":[81],"HEVC.":[83],"To":[84],"address":[85],"issue,":[87],"we":[88],"propose":[89],"a":[90,95,100,125,141,161],"lightweight,":[91],"adaptive":[92],"information":[93],"(LAI-CNN),":[94],"compact":[96,126],"CNN-based":[97],"model":[98,127],"featuring":[99],"three-stage":[101],"scheme":[103],"integrates":[105],"VVC":[106,188],"inter-coding":[107],"structure":[108],"constraints":[109],"make":[111],"fast":[112],"accurate":[114],"QTMT":[115],"partitioning":[116],"decisions,":[117],"thereby":[118],"reducing":[119],"redundant":[120],"RDO":[121],"operations":[122],"architecture.":[128],"Experimental":[129],"results":[130,178],"under":[131],"VTM22.0":[133],"Random":[134],"Access":[135],"configuration":[136],"show":[137],"LAI-CNN":[139],"achieves":[140],"6.":[145],"3":[146,165],"5":[147],"\\%":[148,167],"-":[149],"4":[150],"9.":[151],"reduction":[155],"in":[156,171,194],"time,":[158],"with":[159],"only":[160],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathbf{1.":[164],"-}$</tex>":[168],"3.48%":[169],"increase":[170],"Bj\u00f8ntegaard":[172],"Delta":[173],"Bit":[174],"Rate":[175],"(BDBR).":[176],"These":[177],"demonstrate":[179],"proposed":[182],"coding":[183],"acceleration":[184],"framework":[185],"significantly":[186],"reduces":[187],"enabling":[191],"practical":[192],"deployment":[193],"scenarios":[196],"such":[197],"as":[198],"live":[199],"streaming,":[200],"interactive":[201],"video":[202],"services,":[203],"cloud-based":[205],"processing.":[206]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-11-28T00:00:00"}
