{"id":"https://openalex.org/W4313598801","doi":"https://doi.org/10.1109/jsait.2023.3234502","title":"Efficient Representation of Large-Alphabet Probability Distributions","display_name":"Efficient Representation of Large-Alphabet Probability Distributions","publication_year":2022,"publication_date":"2022-12-01","ids":{"openalex":"https://openalex.org/W4313598801","doi":"https://doi.org/10.1109/jsait.2023.3234502"},"language":"en","primary_location":{"id":"doi:10.1109/jsait.2023.3234502","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jsait.2023.3234502","pdf_url":null,"source":{"id":"https://openalex.org/S4210211895","display_name":"IEEE Journal on Selected Areas in Information Theory","issn_l":"2641-8770","issn":["2641-8770"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal on Selected Areas in Information Theory","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006903412","display_name":"Aviv Adler","orcid":"https://orcid.org/0000-0003-3698-7639"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Aviv Adler","raw_affiliation_strings":["EECS Department, Massachusetts Institute of Technology, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"EECS Department, Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071582967","display_name":"Jennifer Tang","orcid":"https://orcid.org/0000-0002-8369-7901"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jennifer Tang","raw_affiliation_strings":["EECS Department, Massachusetts Institute of Technology, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"EECS Department, Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031031216","display_name":"Yury Polyanskiy","orcid":null},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yury Polyanskiy","raw_affiliation_strings":["EECS Department, Massachusetts Institute of Technology, Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"EECS Department, Massachusetts Institute of Technology, Cambridge, MA, USA","institution_ids":["https://openalex.org/I63966007"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5006903412"],"corresponding_institution_ids":["https://openalex.org/I63966007"],"apc_list":null,"apc_paid":null,"fwci":0.7957,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.77405211,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"3","issue":"4","first_page":"651","last_page":"663"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11321","display_name":"Error Correcting Code Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.6565772294998169},{"id":"https://openalex.org/keywords/minimax","display_name":"Minimax","score":0.607865035533905},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.5921077132225037},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.5663982629776001},{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.5256891250610352},{"id":"https://openalex.org/keywords/asymptotically-optimal-algorithm","display_name":"Asymptotically optimal algorithm","score":0.4987061023712158},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.494872510433197},{"id":"https://openalex.org/keywords/probability-distribution","display_name":"Probability distribution","score":0.47085827589035034},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.43920186161994934},{"id":"https://openalex.org/keywords/alphabet","display_name":"Alphabet","score":0.4147578775882721},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.2543875575065613},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.1264076828956604}],"concepts":[{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.6565772294998169},{"id":"https://openalex.org/C149728462","wikidata":"https://www.wikidata.org/wiki/Q751319","display_name":"Minimax","level":2,"score":0.607865035533905},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.5921077132225037},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.5663982629776001},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.5256891250610352},{"id":"https://openalex.org/C181789720","wikidata":"https://www.wikidata.org/wiki/Q4812191","display_name":"Asymptotically optimal algorithm","level":2,"score":0.4987061023712158},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.494872510433197},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.47085827589035034},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.43920186161994934},{"id":"https://openalex.org/C112876837","wikidata":"https://www.wikidata.org/wiki/Q837518","display_name":"Alphabet","level":2,"score":0.4147578775882721},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2543875575065613},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.1264076828956604},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/jsait.2023.3234502","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jsait.2023.3234502","pdf_url":null,"source":{"id":"https://openalex.org/S4210211895","display_name":"IEEE Journal on Selected Areas in Information Theory","issn_l":"2641-8770","issn":["2641-8770"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal on Selected Areas in Information Theory","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6399999856948853,"id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G1332620490","display_name":null,"funder_award_id":"CCF-2131115","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320338294","display_name":"Air Force Research Laboratory","ror":"https://ror.org/02e2egq70"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1576475658","https://openalex.org/W1686946872","https://openalex.org/W2001968606","https://openalex.org/W2004003571","https://openalex.org/W2018040777","https://openalex.org/W2068071220","https://openalex.org/W2085854859","https://openalex.org/W2089419199","https://openalex.org/W2103723258","https://openalex.org/W2127314673","https://openalex.org/W2132512523","https://openalex.org/W2138570191","https://openalex.org/W2142228262","https://openalex.org/W2171052652","https://openalex.org/W2963373550","https://openalex.org/W2963873929","https://openalex.org/W3130985436","https://openalex.org/W3198362564","https://openalex.org/W3198737060","https://openalex.org/W4288346545","https://openalex.org/W4388297583","https://openalex.org/W6637108112","https://openalex.org/W6675471587","https://openalex.org/W6680765659","https://openalex.org/W6763653508","https://openalex.org/W7018288791"],"related_works":["https://openalex.org/W2016058626","https://openalex.org/W2474724840","https://openalex.org/W2895916002","https://openalex.org/W1530911128","https://openalex.org/W1814049089","https://openalex.org/W2026003927","https://openalex.org/W2768147893","https://openalex.org/W3136967581","https://openalex.org/W2015073710","https://openalex.org/W2212806282"],"abstract_inverted_index":{"A":[0,46],"number":[1],"of":[2,20,24,72,102,111,210],"engineering":[3],"and":[4,9,59,97,144,148,161],"scientific":[5],"problems":[6],"require":[7],"representing":[8],"manipulating":[10],"probability":[11,175],"distributions":[12,176],"over":[13,177],"large":[14],"alphabets,":[15,99],"which":[16],"we":[17,155],"may":[18],"think":[19],"as":[21,170,222,226],"long":[22],"vectors":[23],"reals":[25],"summing":[26],"to":[27,35,50,62,84,114,118,130],"1.":[28],"In":[29],"some":[30],"cases":[31],"it":[32],"is":[33,49,168,221],"required":[34],"represent":[36],"such":[37,182],"a":[38,69,106,157,178,183,197],"vector":[39],"with":[40],"only":[41],"b":[42],"bits":[43],"per":[44],"entry.":[45],"natural":[47],"choice":[48],"partition":[51],"the":[52,100,126,164,202,206,211,218,227],"interval":[53],"0,1":[54],"into":[55],"2b":[56],"uniform":[57,213,228],"bins":[58],"quantize":[60],"entries":[61],"each":[63],"bin":[64],"independently.":[65],"We":[66],"show":[67,162],"that":[68,163,217],"minor":[70],"modification":[71],"this":[73],"procedure":[74],"\u2013":[75,86],"applying":[76],"an":[77,88],"entrywise":[78],"non-linear":[79],"function":[80],"(compander)":[81],"f(x)":[82],"prior":[83],"quantization":[85,91],"yields":[87],"extremely":[89],"effective":[90],"method.":[92],"For":[93],"example,":[94],"for":[95,136,149,173,187,201,224,230],"b=8(16)":[96],"105-sized":[98],"quality":[101],"representation":[103],"improves":[104,125],"from":[105,128],"loss":[107,127,192,204],"(under":[108],"KL":[109],"divergence)":[110],"0.5(0.1)":[112],"bits/entry":[113],"10-4(10-9)":[115,131],"bits/entry.":[116,132],"Compared":[117],"floating":[119],"point":[120],"representations,":[121],"our":[122],"compander":[123,166,184],"method":[124],"10-1(10-6)":[129],"These":[133],"numbers":[134],"hold":[135],"both":[137],"real-world":[138],"data":[139],"(word":[140],"frequencies":[141],"in":[142],"books":[143],"DNA":[145],"k-mer":[146],"counts)":[147],"synthetic":[150],"randomly":[151],"generated":[152],"distributions.":[153],"Theoretically,":[154],"analyze":[156],"minimax":[158,199],"optimality":[159,209],"criterion":[160,200],"closed-form":[165],"f(x)ArcSinh(cK(KlogK)x)":[167],"(asymptotically":[169],"b\u221e)":[171],"optimal":[172],"quantizing":[174],"-letter":[179],"alphabet.":[180],"Non-asymptotically,":[181],"(substituting":[185],"1/2":[186],"cfor":[188],"simplicity)":[189],"has":[190],"KL-quantization":[191],"bounded":[193],"by":[194],"\u22648\u22192-2blog2.":[195],"Interestingly,":[196],"similar":[198],"quadratic":[203,231],"on":[205],"hypercube":[207],"shows":[208],"standard":[212],"quantizer.":[214],"This":[215],"suggests":[216],"ArcSinh":[219],"quantizer":[220,229],"fundamental":[223],"KL-distortion":[225],"distortion.":[232]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
