{"id":"https://openalex.org/W4407131706","doi":"https://doi.org/10.48550/arxiv.2502.01189","title":"Compressed Image Generation with Denoising Diffusion Codebook Models","display_name":"Compressed Image Generation with Denoising Diffusion Codebook Models","publication_year":2025,"publication_date":"2025-02-03","ids":{"openalex":"https://openalex.org/W4407131706","doi":"https://doi.org/10.48550/arxiv.2502.01189"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2502.01189","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.01189","pdf_url":"https://arxiv.org/pdf/2502.01189","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2502.01189","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030762660","display_name":"Guy Ohayon","orcid":"https://orcid.org/0009-0008-5112-6558"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ohayon, Guy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008678260","display_name":"H Manor","orcid":"https://orcid.org/0009-0007-6851-148X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manor, Hila","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058178036","display_name":"Tomer Michaeli","orcid":"https://orcid.org/0000-0003-0525-8054"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Michaeli, Tomer","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5020279598","display_name":"Michael Elad","orcid":"https://orcid.org/0000-0001-8131-6928"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Elad, Michael","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5030762660"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9437000155448914,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9437000155448914,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.9241999983787537,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/codebook","display_name":"Codebook","score":0.8601229786872864},{"id":"https://openalex.org/keywords/image-denoising","display_name":"Image denoising","score":0.6158478260040283},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5574780702590942},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.5563896894454956},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5397255420684814},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.5397053956985474},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.45870837569236755},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.43915605545043945},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.38293662667274475},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.10333523154258728}],"concepts":[{"id":"https://openalex.org/C127759330","wikidata":"https://www.wikidata.org/wiki/Q637416","display_name":"Codebook","level":2,"score":0.8601229786872864},{"id":"https://openalex.org/C2983327147","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Image denoising","level":3,"score":0.6158478260040283},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5574780702590942},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.5563896894454956},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5397255420684814},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.5397053956985474},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.45870837569236755},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.43915605545043945},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.38293662667274475},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10333523154258728},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2502.01189","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.01189","pdf_url":"https://arxiv.org/pdf/2502.01189","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2502.01189","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2502.01189","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2502.01189","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.01189","pdf_url":"https://arxiv.org/pdf/2502.01189","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2087258800","https://openalex.org/W2810018092","https://openalex.org/W2387428419","https://openalex.org/W4401571043","https://openalex.org/W2098237619","https://openalex.org/W1974034585","https://openalex.org/W4406054402","https://openalex.org/W4312627788","https://openalex.org/W2353444452","https://openalex.org/W2001438600"],"abstract_inverted_index":{"We":[0,77],"present":[1],"a":[2,39,90,98,149,160],"novel":[3],"generative":[4,95],"approach":[5],"based":[6],"on":[7],"Denoising":[8,59],"Diffusion":[9,60],"Models":[10],"(DDMs),":[11],"which":[12],"produces":[13],"high-quality":[14],"image":[15,102,107,126,130],"samples":[16,43],"along":[17],"with":[18,38,139,162],"their":[19,140],"losslessly":[20],"compressed":[21,155],"bit-stream":[22,142],"representations.":[23,143],"This":[24],"is":[25,146],"obtained":[26],"by":[27,112,148],"replacing":[28],"the":[29,35,82,85,133,153,169],"standard":[30,70],"Gaussian":[31,50],"noise":[32,42,115],"sampling":[33],"in":[34],"reverse":[36],"diffusion":[37],"selection":[40],"of":[41,47,69,152,165],"from":[44,84],"pre-defined":[45],"codebooks":[46,86],"fixed":[48],"iid":[49],"vectors.":[51],"Surprisingly,":[52],"we":[53,118],"find":[54],"that":[55,87],"our":[56,94,120],"method,":[57],"termed":[58],"Codebook":[61],"Model":[62],"(DDCM),":[63],"retains":[64],"sample":[65],"quality":[66],"and":[67,80],"diversity":[68],"DDMs,":[71],"even":[72],"for":[73,168],"extremely":[74],"small":[75],"codebooks.":[76],"leverage":[78],"DDCM":[79],"pick":[81],"noises":[83],"best":[88],"match":[89],"given":[91],"image,":[92],"converting":[93],"model":[96],"into":[97],"highly":[99],"effective":[100],"lossy":[101],"codec":[103],"achieving":[104],"state-of-the-art":[105],"perceptual":[106],"compression":[108,121],"results.":[109],"More":[110],"generally,":[111],"setting":[113],"other":[114],"selections":[116],"rules,":[117],"extend":[119],"method":[122],"to":[123],"any":[124],"conditional":[125,156],"generation":[127,157],"task":[128],"(e.g.,":[129],"restoration),":[131],"where":[132],"generated":[134],"images":[135],"are":[136],"produced":[137],"jointly":[138],"condensed":[141],"Our":[144],"work":[145],"accompanied":[147],"mathematical":[150],"interpretation":[151],"proposed":[154],"schemes,":[158],"establishing":[159],"connection":[161],"score-based":[163],"approximations":[164],"posterior":[166],"samplers":[167],"tasks":[170],"considered.":[171]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
