{"id":"https://openalex.org/W4405974086","doi":"https://doi.org/10.1109/tip.2024.3522813","title":"Exploiting Latent Properties to Optimize Neural Codecs","display_name":"Exploiting Latent Properties to Optimize Neural Codecs","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4405974086","doi":"https://doi.org/10.1109/tip.2024.3522813","pmid":"https://pubmed.ncbi.nlm.nih.gov/40030757"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2024.3522813","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2024.3522813","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hal.science/hal-04945981/document","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040784126","display_name":"Muhammet Balc\u0131lar","orcid":"https://orcid.org/0000-0003-1428-4297"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muhammet Balcilar","raw_affiliation_strings":["InterDigital Inc., Cesson-S&#x00E9;vign&#x00E9;, France"],"raw_orcid":"https://orcid.org/0000-0003-1428-4297","affiliations":[{"raw_affiliation_string":"InterDigital Inc., Cesson-S&#x00E9;vign&#x00E9;, France","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020394666","display_name":"Bharath Bhushan Damodaran","orcid":"https://orcid.org/0000-0002-4466-017X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bharath Bhushan Damodaran","raw_affiliation_strings":["InterDigital Inc., Cesson-S&#x00E9;vign&#x00E9;, France"],"raw_orcid":"https://orcid.org/0000-0002-4466-017X","affiliations":[{"raw_affiliation_string":"InterDigital Inc., Cesson-S&#x00E9;vign&#x00E9;, France","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019525045","display_name":"Karam Naser","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Karam Naser","raw_affiliation_strings":["InterDigital Inc., Cesson-S&#x00E9;vign&#x00E9;, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"InterDigital Inc., Cesson-S&#x00E9;vign&#x00E9;, France","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077409267","display_name":"Franck Galpin","orcid":"https://orcid.org/0000-0003-2123-7819"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Franck Galpin","raw_affiliation_strings":["InterDigital Inc., Cesson-S&#x00E9;vign&#x00E9;, France"],"raw_orcid":"https://orcid.org/0000-0003-2123-7819","affiliations":[{"raw_affiliation_string":"InterDigital Inc., Cesson-S&#x00E9;vign&#x00E9;, France","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5041269156","display_name":"Pierre Hellier","orcid":"https://orcid.org/0000-0003-3603-2381"},"institutions":[{"id":"https://openalex.org/I56067802","display_name":"Universit\u00e9 de Rennes","ror":"https://ror.org/015m7wh34","country_code":"FR","type":"education","lineage":["https://openalex.org/I56067802"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Pierre Hellier","raw_affiliation_strings":["University of Rennes, Rennes, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Rennes, Rennes, France","institution_ids":["https://openalex.org/I56067802"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0015204,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"34","issue":null,"first_page":"306","last_page":"319"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/codec","display_name":"Codec","score":0.8143309354782104},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7617635726928711},{"id":"https://openalex.org/keywords/vector-quantization","display_name":"Vector quantization","score":0.6337146759033203},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.5462162494659424},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.5139805674552917},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5079794526100159},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.47008657455444336},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44387513399124146},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.4323784112930298},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3689712882041931},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.0817585289478302}],"concepts":[{"id":"https://openalex.org/C161765866","wikidata":"https://www.wikidata.org/wiki/Q184748","display_name":"Codec","level":2,"score":0.8143309354782104},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7617635726928711},{"id":"https://openalex.org/C199833920","wikidata":"https://www.wikidata.org/wiki/Q612536","display_name":"Vector quantization","level":2,"score":0.6337146759033203},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.5462162494659424},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.5139805674552917},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5079794526100159},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.47008657455444336},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44387513399124146},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.4323784112930298},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3689712882041931},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0817585289478302},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tip.2024.3522813","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2024.3522813","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:40030757","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40030757","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null},{"id":"pmh:oai:HAL:hal-04945981v1","is_oa":true,"landing_page_url":"https://hal.science/hal-04945981","pdf_url":"https://hal.science/hal-04945981/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Transactions on Image Processing, 2025, IEEE transactions on image processing, 34, pp.306 - 319. &#x27E8;10.1109/tip.2024.3522813&#x27E9;","raw_type":"Journal articles"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-04945981v1","is_oa":true,"landing_page_url":"https://hal.science/hal-04945981","pdf_url":"https://hal.science/hal-04945981/document","source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Transactions on Image Processing, 2025, IEEE transactions on image processing, 34, pp.306 - 319. &#x27E8;10.1109/tip.2024.3522813&#x27E9;","raw_type":"Journal articles"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4405974086.pdf"},"referenced_works_count":58,"referenced_works":["https://openalex.org/W1634005169","https://openalex.org/W1933799648","https://openalex.org/W2001968606","https://openalex.org/W2024470753","https://openalex.org/W2040336387","https://openalex.org/W2060727197","https://openalex.org/W2119352491","https://openalex.org/W2137983211","https://openalex.org/W2140940105","https://openalex.org/W2142228262","https://openalex.org/W2493109494","https://openalex.org/W2552465432","https://openalex.org/W2785562966","https://openalex.org/W2962676454","https://openalex.org/W2969260367","https://openalex.org/W2987947587","https://openalex.org/W3010533237","https://openalex.org/W3031546776","https://openalex.org/W3034469748","https://openalex.org/W3035195755","https://openalex.org/W3091266734","https://openalex.org/W3092877102","https://openalex.org/W3095497211","https://openalex.org/W3097448661","https://openalex.org/W3098284407","https://openalex.org/W3110286842","https://openalex.org/W3120355627","https://openalex.org/W3175457126","https://openalex.org/W3203234039","https://openalex.org/W3206996732","https://openalex.org/W4206355076","https://openalex.org/W4206364355","https://openalex.org/W4214761665","https://openalex.org/W4226355936","https://openalex.org/W4283377204","https://openalex.org/W4285069933","https://openalex.org/W4285483958","https://openalex.org/W4287605633","https://openalex.org/W4294567867","https://openalex.org/W4311415873","https://openalex.org/W4312597589","https://openalex.org/W4317555471","https://openalex.org/W4386071691","https://openalex.org/W4386075611","https://openalex.org/W4386076451","https://openalex.org/W4386598475","https://openalex.org/W6640455647","https://openalex.org/W6675207249","https://openalex.org/W6734035190","https://openalex.org/W6741057705","https://openalex.org/W6754634825","https://openalex.org/W6758867260","https://openalex.org/W6763486759","https://openalex.org/W6778914582","https://openalex.org/W6779775157","https://openalex.org/W6784858424","https://openalex.org/W6793364766","https://openalex.org/W6802036239"],"related_works":["https://openalex.org/W2964213236","https://openalex.org/W2163719598","https://openalex.org/W3161919736","https://openalex.org/W2387018512","https://openalex.org/W2107680156","https://openalex.org/W3209251257","https://openalex.org/W2094714038","https://openalex.org/W2039662546","https://openalex.org/W2144404403","https://openalex.org/W2106967209"],"abstract_inverted_index":{"End-to-end":[0],"image":[1],"and":[2,42,67,89],"video":[3],"codecs":[4,26,57],"are":[5],"becoming":[6],"increasingly":[7],"competitive,":[8],"compared":[9],"to":[10,38,49,82,92,122,158,172],"traditional":[11,31,193],"compression":[12,160],"techniques":[13],"that":[14,102,128,166],"have":[15,27],"been":[16],"developed":[17],"through":[18],"decades":[19],"of":[20,64,70,96,174],"manual":[21],"engineering":[22],"efforts.":[23],"These":[24],"trainable":[25],"many":[28],"advantages":[29],"over":[30,110],"techniques,":[32],"such":[33],"as":[34,155,197],"their":[35,50],"straightforward":[36],"adaptation":[37],"perceptual":[39],"distortion":[40],"metrics":[41],"high":[43],"performance":[44,95,109,195],"in":[45,74],"specific":[46],"fields":[47],"thanks":[48],"learning":[51],"ability.":[52],"However,":[53],"current":[54],"state-of-the-art":[55],"neural":[56],"do":[58],"not":[59,145],"fully":[60],"exploit":[61],"the":[62,68,71,94,129,134,139,148,153,175,178,187],"benefits":[63],"vector":[65,120],"quantization":[66,88,106,121],"existence":[69],"entropy":[72,90,130,188],"gradient":[73,189],"decoding":[75],"devices.":[76],"In":[77,185],"this":[78],"paper,":[79],"we":[80,100,126],"propose":[81],"leverage":[83],"these":[84,167],"two":[85],"properties":[86],"(vector":[87],"gradient)":[91],"improve":[93,108,123],"off-the-shelf":[97],"codecs.":[98],"Firstly,":[99],"demonstrate":[101],"using":[103,116],"non-uniform":[104],"scalar":[105],"cannot":[107],"uniform":[111,119],"quantization.":[112],"We":[113,150],"thus":[114],"suggest":[115],"predefined":[117],"optimal":[118],"performance.":[124,161],"Secondly,":[125],"show":[127,165],"gradient,":[131,142],"available":[132,146],"at":[133,147],"decoder,":[135],"is":[136,144],"correlated":[137],"with":[138],"reconstruction":[140],"error":[141],"which":[143],"decoder.":[149],"therefore":[151],"use":[152],"former":[154],"a":[156],"proxy":[157],"enhance":[159],"Our":[162],"experimental":[163],"results":[164],"approaches":[168],"save":[169],"between":[170],"1":[171],"3%":[173],"rate":[176],"for":[177],"same":[179],"quality":[180],"across":[181],"various":[182],"pre-trained":[183],"methods.":[184],"addition,":[186],"based":[190],"solution":[191],"improves":[192],"codec":[194],"significantly":[196],"well.":[198]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
