{"id":"https://openalex.org/W3117007398","doi":"https://doi.org/10.1109/vcip49819.2020.9301828","title":"Learned image and video compression with deep neural networks","display_name":"Learned image and video compression with deep neural networks","publication_year":2020,"publication_date":"2020-12-01","ids":{"openalex":"https://openalex.org/W3117007398","doi":"https://doi.org/10.1109/vcip49819.2020.9301828","mag":"3117007398"},"language":"en","primary_location":{"id":"doi:10.1109/vcip49819.2020.9301828","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip49819.2020.9301828","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE International Conference on Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051590556","display_name":"Dong-Hui Xu","orcid":"https://orcid.org/0000-0002-8307-3613"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Dong Xu","raw_affiliation_strings":["School of Electrical and Information Engineering, The University of Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, The University of Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086398934","display_name":"Guo Lu","orcid":"https://orcid.org/0000-0001-6951-0090"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Guo Lu","raw_affiliation_strings":["School of Electrical and Information Engineering, The University of Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, The University of Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082999550","display_name":"Ren Yang","orcid":"https://orcid.org/0000-0003-4124-4186"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Ren Yang","raw_affiliation_strings":["School of Electrical and Information Engineering, The University of Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, The University of Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052236177","display_name":"Radu Timofte","orcid":"https://orcid.org/0000-0002-1478-0402"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Radu Timofte","raw_affiliation_strings":["School of Electrical and Information Engineering, The University of Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, The University of Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5051590556"],"corresponding_institution_ids":["https://openalex.org/I129604602"],"apc_list":null,"apc_paid":null,"fwci":1.1724,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.81746992,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10741","display_name":"Video Coding and Compression Technologies","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8100485801696777},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.7129263281822205},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6276164650917053},{"id":"https://openalex.org/keywords/image-compression","display_name":"Image compression","score":0.6272776126861572},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.6086305975914001},{"id":"https://openalex.org/keywords/motion-compensation","display_name":"Motion compensation","score":0.4527837932109833},{"id":"https://openalex.org/keywords/compression-artifact","display_name":"Compression artifact","score":0.4443276524543762},{"id":"https://openalex.org/keywords/video-compression-picture-types","display_name":"Video compression picture types","score":0.4292139410972595},{"id":"https://openalex.org/keywords/jpeg","display_name":"JPEG","score":0.42898663878440857},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.41563594341278076},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3319207727909088},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.31953805685043335},{"id":"https://openalex.org/keywords/video-processing","display_name":"Video processing","score":0.2853604853153229},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.25950539112091064},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.08368971943855286}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8100485801696777},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.7129263281822205},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6276164650917053},{"id":"https://openalex.org/C13481523","wikidata":"https://www.wikidata.org/wiki/Q412438","display_name":"Image compression","level":4,"score":0.6272776126861572},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.6086305975914001},{"id":"https://openalex.org/C128840427","wikidata":"https://www.wikidata.org/wiki/Q1302174","display_name":"Motion compensation","level":2,"score":0.4527837932109833},{"id":"https://openalex.org/C57654395","wikidata":"https://www.wikidata.org/wiki/Q1097775","display_name":"Compression artifact","level":5,"score":0.4443276524543762},{"id":"https://openalex.org/C106030495","wikidata":"https://www.wikidata.org/wiki/Q1797012","display_name":"Video compression picture types","level":4,"score":0.4292139410972595},{"id":"https://openalex.org/C198751489","wikidata":"https://www.wikidata.org/wiki/Q2195","display_name":"JPEG","level":3,"score":0.42898663878440857},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.41563594341278076},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3319207727909088},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.31953805685043335},{"id":"https://openalex.org/C65483669","wikidata":"https://www.wikidata.org/wiki/Q3536669","display_name":"Video processing","level":2,"score":0.2853604853153229},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.25950539112091064},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.08368971943855286}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/vcip49819.2020.9301828","is_oa":false,"landing_page_url":"https://doi.org/10.1109/vcip49819.2020.9301828","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE International Conference on Visual Communications and Image Processing (VCIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.550000011920929,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2187171999","https://openalex.org/W3109737331","https://openalex.org/W3016393364","https://openalex.org/W2962930383","https://openalex.org/W4287814353","https://openalex.org/W43054317","https://openalex.org/W3162084246","https://openalex.org/W2807545779","https://openalex.org/W4247602681","https://openalex.org/W3210165700"],"abstract_inverted_index":{"This":[0],"tutorial":[1,194],"aims":[2],"at":[3],"reviewing":[4],"the":[5,9,22,45,49,66,70,79,85,109,123,142,146,159,198,204,215,221],"recent":[6,222],"progress":[7],"in":[8,65,108,135,224],"deep":[10,25,87,93,125],"learning":[11,26,88,126,170,206],"based":[12,54,95,171,207],"data":[13,46,80,165,189,200,209],"compression,":[14],"including":[15],"image":[16,40,129],"compression":[17,47,81,96,130,166,210],"and":[18,39,57,106,114,131,153,167,203],"video":[19,132],"compression.":[20,116,133,190],"In":[21,117,191],"past":[23],"years,":[24],"techniques":[27,127,202],"have":[28,98],"been":[29],"successfully":[30],"applied":[31],"to":[32,77],"a":[33],"large":[34],"number":[35],"of":[36,111],"computer":[37,112],"vision":[38,113],"processing":[41],"tasks.":[42],"However,":[43],"for":[44,128,145,163,187],"task,":[48],"traditional":[50,147,199],"approaches":[51,97],"(i.e.,":[52],"block":[53],"motion":[55,58],"estimation":[56],"compensation,":[59],"etc.)":[60],"are":[61],"still":[62],"widely":[63,182],"employed":[64],"mainstream":[67],"codecs.":[68],"Considering":[69],"powerful":[71],"representation":[72],"capability,":[73],"it":[74],"is":[75],"possible":[76],"improve":[78],"performance":[82],"by":[83],"employing":[84],"advanced":[86],"technologies.":[89],"To":[90],"this":[91,118,136,225],"end,":[92],"leaning":[94],"recently":[99],"received":[100],"significant":[101],"attention":[102],"from":[103],"both":[104,197],"academia":[105],"industry":[107],"field":[110],"image/video":[115],"tutorial,":[119,137],"we":[120,138,156,178],"will":[121,139,157,179,195,213],"introduce":[122,141],"related":[124],"Specifically,":[134],"first":[140],"basic":[143],"pipeline":[144],"codecs,":[148],"such":[149],"as":[150],"JPEG,":[151],"H.264":[152],"HEVC.":[154],"Then,":[155],"discuss":[158],"common":[160],"network":[161],"architectures":[162],"visual":[164,188,208],"analyse":[168],"different":[169,218],"entropy":[172],"models.":[173],"Based":[174],"on":[175],"these":[176],"techniques,":[177],"describe":[180],"several":[181],"used":[183],"end-to-end":[184],"optimized":[185],"frameworks":[186],"summary,":[192],"our":[193],"cover":[196],"coding":[201],"popular":[205],"algorithms,":[211],"which":[212],"help":[214],"audiences":[216],"with":[217],"backgrounds":[219],"learn":[220],"progresses":[223],"emerging":[226],"research":[227],"area.":[228]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
