{"id":"https://openalex.org/W7127975605","doi":"https://doi.org/10.48550/arxiv.2602.03906","title":"GeoIB: Geometry-Aware Information Bottleneck via Statistical-Manifold Compression","display_name":"GeoIB: Geometry-Aware Information Bottleneck via Statistical-Manifold Compression","publication_year":2026,"publication_date":"2026-02-03","ids":{"openalex":"https://openalex.org/W7127975605","doi":"https://doi.org/10.48550/arxiv.2602.03906"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.03906","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125114669","display_name":"Weiqi Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Weiqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059567156","display_name":"Zhiyi Tian","orcid":"https://orcid.org/0000-0001-8905-0941"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian, Zhiyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125168204","display_name":"Chenhan Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Chenhan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125110420","display_name":"Shui Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Shui","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5125114669"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.38359999656677246,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.38359999656677246,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.34549999237060547,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.0689999982714653,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/information-bottleneck-method","display_name":"Information bottleneck method","score":0.8370000123977661},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6029999852180481},{"id":"https://openalex.org/keywords/geodesic","display_name":"Geodesic","score":0.5462999939918518},{"id":"https://openalex.org/keywords/mutual-information","display_name":"Mutual information","score":0.5425999760627747},{"id":"https://openalex.org/keywords/upper-and-lower-bounds","display_name":"Upper and lower bounds","score":0.5127999782562256},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.4494999945163727},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.43140000104904175},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.41749998927116394},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.3695000112056732},{"id":"https://openalex.org/keywords/information-theory","display_name":"Information theory","score":0.36809998750686646}],"concepts":[{"id":"https://openalex.org/C60008888","wikidata":"https://www.wikidata.org/wiki/Q6031013","display_name":"Information bottleneck method","level":3,"score":0.8370000123977661},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6029999852180481},{"id":"https://openalex.org/C165818556","wikidata":"https://www.wikidata.org/wiki/Q213488","display_name":"Geodesic","level":2,"score":0.5462999939918518},{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.5425999760627747},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.5238000154495239},{"id":"https://openalex.org/C77553402","wikidata":"https://www.wikidata.org/wiki/Q13222579","display_name":"Upper and lower bounds","level":2,"score":0.5127999782562256},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.49390000104904175},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.4494999945163727},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.43140000104904175},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.41749998927116394},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.38019999861717224},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.3695000112056732},{"id":"https://openalex.org/C52622258","wikidata":"https://www.wikidata.org/wiki/Q131222","display_name":"Information theory","level":2,"score":0.36809998750686646},{"id":"https://openalex.org/C79772020","wikidata":"https://www.wikidata.org/wiki/Q5159264","display_name":"Conditional independence","level":2,"score":0.34290000796318054},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3409000039100647},{"id":"https://openalex.org/C35651441","wikidata":"https://www.wikidata.org/wiki/Q625303","display_name":"Independence (probability theory)","level":2,"score":0.31279999017715454},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.3111000061035156},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.31029999256134033},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.3091000020503998},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.2937999963760376},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.2897999882698059},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.28870001435279846},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.28610000014305115},{"id":"https://openalex.org/C39927690","wikidata":"https://www.wikidata.org/wiki/Q11197","display_name":"Logarithm","level":2,"score":0.27959999442100525},{"id":"https://openalex.org/C191795146","wikidata":"https://www.wikidata.org/wiki/Q3878446","display_name":"Norm (philosophy)","level":2,"score":0.2768999934196472},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.26840001344680786},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.26339998841285706},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.2628999948501587},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.26260000467300415},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.260699987411499},{"id":"https://openalex.org/C109546454","wikidata":"https://www.wikidata.org/wiki/Q3798604","display_name":"Information geometry","level":4,"score":0.2563999891281128},{"id":"https://openalex.org/C17825722","wikidata":"https://www.wikidata.org/wiki/Q17285","display_name":"Plane (geometry)","level":2,"score":0.2531999945640564},{"id":"https://openalex.org/C153207627","wikidata":"https://www.wikidata.org/wiki/Q863873","display_name":"Code word","level":3,"score":0.2508000135421753}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.03906","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.03906","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.03906","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.03906","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Information":[0],"Bottleneck":[1],"(IB)":[2],"is":[3,11,124,169,229],"widely":[4],"used,":[5],"but":[6],"in":[7,195],"deep":[8],"learning,":[9],"it":[10],"usually":[12],"implemented":[13],"through":[14,55],"tractable":[15],"surrogates,":[16],"such":[17],"as":[18,85],"variational":[19],"bounds":[20],"or":[21],"neural":[22],"mutual":[23,71],"information":[24,59,72,105,197],"(MI)":[25,73],"estimators,":[26],"rather":[27],"than":[28,199],"directly":[29],"controlling":[30],"the":[31,52,56,91,148,158,164,173,183,196,200],"MI":[32],"I(X;Z)":[33,78],"itself.":[34],"The":[35,224],"looseness":[36],"and":[37,47,61,79,123,126,161,180,192,210,216],"estimator-dependent":[38],"bias":[39],"can":[40],"make":[41],"IB":[42,53,202],"\"compression\"":[43],"only":[44],"indirectly":[45],"controlled":[46],"optimization":[48,211],"fragile.":[49],"We":[50,75,150,176],"revisit":[51],"problem":[54],"lens":[57],"of":[58,147,227],"geometry":[60],"propose":[62],"a":[63,112,128,135,153,186,220],"\\textbf{Geo}metric":[64],"\\textbf{I}nformation":[65],"\\textbf{B}ottleneck":[66],"(\\textbf{GeoIB})":[67],"that":[68,77,133,163,182],"dispenses":[69],"with":[70,107,157],"estimation.":[74],"show":[76],"I(Z;Y)":[80],"admit":[81],"exact":[82],"projection":[83],"forms":[84],"minimal":[86],"Kullback-Leibler":[87],"(KL)":[88],"distances":[89],"from":[90],"joint":[92],"distributions":[93],"to":[94,120,172],"their":[95],"respective":[96],"independence":[97],"manifolds.":[98],"Guided":[99],"by":[100,142,213],"this":[101],"view,":[102],"GeoIB":[103,184,207,228],"controls":[104],"compression":[106,193],"two":[108],"complementary":[109],"terms:":[110],"(i)":[111],"distribution-level":[113],"Fisher-Rao":[114],"(FR)":[115],"discrepancy,":[116],"which":[117],"matches":[118],"KL":[119],"second":[121],"order":[122],"reparameterization-invariant;":[125],"(ii)":[127],"geometry-level":[129],"Jacobian-Frobenius":[130],"(JF)":[131],"term":[132],"provides":[134],"local":[136],"capacity-type":[137],"upper":[138],"bound":[139],"on":[140,204],"I(Z;X)":[141],"penalizing":[143],"pullback":[144],"volume":[145],"expansion":[146],"encoder.":[149],"further":[151],"derive":[152],"natural-gradient":[154,167],"optimizer":[155],"consistent":[156],"FR":[159],"metric":[160],"prove":[162],"standard":[165],"additive":[166],"step":[168],"first-order":[170],"equivalent":[171],"geodesic":[174],"update.":[175],"conducted":[177],"extensive":[178],"experiments":[179],"observed":[181],"achieves":[185],"better":[187],"trade-off":[188],"between":[189],"prediction":[190],"accuracy":[191],"ratio":[194],"plane":[198],"mainstream":[201],"baselines":[203],"popular":[205],"datasets.":[206],"improves":[208],"invariance":[209],"stability":[212],"unifying":[214],"distributional":[215],"geometric":[217],"regularization":[218],"under":[219],"single":[221],"bottleneck":[222],"multiplier.":[223],"source":[225],"code":[226],"released":[230],"at":[231],"\"https://anonymous.4open.science/r/G-IB-0569\".":[232]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-07T00:00:00"}
