{"id":"https://openalex.org/W4289655274","doi":"https://doi.org/10.1109/isit50566.2022.9834357","title":"Understanding Deep Neural Networks Using Sliced Mutual Information","display_name":"Understanding Deep Neural Networks Using Sliced Mutual Information","publication_year":2022,"publication_date":"2022-06-26","ids":{"openalex":"https://openalex.org/W4289655274","doi":"https://doi.org/10.1109/isit50566.2022.9834357"},"language":"en","primary_location":{"id":"doi:10.1109/isit50566.2022.9834357","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isit50566.2022.9834357","pdf_url":null,"source":{"id":"https://openalex.org/S4363604560","display_name":"2022 IEEE International Symposium on Information Theory (ISIT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Symposium on Information Theory (ISIT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028245435","display_name":"Shelvia Wongso","orcid":"https://orcid.org/0009-0004-8465-1640"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Shelvia Wongso","raw_affiliation_strings":["National University of Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028037531","display_name":"Rohan Ghosh","orcid":"https://orcid.org/0000-0002-6728-1076"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Rohan Ghosh","raw_affiliation_strings":["National University of Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069355437","display_name":"Mehul Motani","orcid":"https://orcid.org/0000-0003-3262-0207"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Mehul Motani","raw_affiliation_strings":["National University of Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5028245435"],"corresponding_institution_ids":["https://openalex.org/I165932596"],"apc_list":null,"apc_paid":null,"fwci":0.5194,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.62669683,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"133","last_page":"138"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9857000112533569,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.9793000221252441,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6535975337028503},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6182131171226501},{"id":"https://openalex.org/keywords/mutual-information","display_name":"Mutual information","score":0.5553372502326965},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5465025305747986}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6535975337028503},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6182131171226501},{"id":"https://openalex.org/C152139883","wikidata":"https://www.wikidata.org/wiki/Q252973","display_name":"Mutual information","level":2,"score":0.5553372502326965},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5465025305747986}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/isit50566.2022.9834357","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isit50566.2022.9834357","pdf_url":null,"source":{"id":"https://openalex.org/S4363604560","display_name":"2022 IEEE International Symposium on Information Theory (ISIT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Symposium on Information Theory (ISIT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320311687","display_name":"Ministry of Education","ror":"https://ror.org/03m01yf64"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1686946872","https://openalex.org/W2008056655","https://openalex.org/W2092939357","https://openalex.org/W2099111195","https://openalex.org/W2114771311","https://openalex.org/W2123469175","https://openalex.org/W2156483112","https://openalex.org/W2593634001","https://openalex.org/W2622719862","https://openalex.org/W2803832867","https://openalex.org/W2962807446","https://openalex.org/W2996320484","https://openalex.org/W2999672496","https://openalex.org/W3006348122","https://openalex.org/W3006705448","https://openalex.org/W3022414928","https://openalex.org/W3040051873","https://openalex.org/W3106022083","https://openalex.org/W3173703884","https://openalex.org/W3206479019","https://openalex.org/W4297749952","https://openalex.org/W6637108112","https://openalex.org/W6748205129","https://openalex.org/W6752051073","https://openalex.org/W6754984521","https://openalex.org/W6772316697","https://openalex.org/W6802202791"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2466816617","https://openalex.org/W1970834875","https://openalex.org/W842936808","https://openalex.org/W3174028392","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433"],"abstract_inverted_index":{"Along":[0],"with":[1],"the":[2,35,71,106,118,129,132,136,141],"practical":[3],"success":[4],"of":[5,38,73,117],"deep":[6,74],"neural":[7],"networks,":[8],"several":[9],"theories":[10],"have":[11],"been":[12],"proposed":[13,80],"to":[14,33,69,94,105,113,144],"explain":[15],"their":[16],"excellent":[17],"generalization":[18],"behaviour.":[19],"One":[20],"such":[21],"theory":[22],"is":[23,52,90],"information":[24,28,81,87,139],"bottleneck,":[25],"using":[26,77],"mutual":[27,86],"(MI)":[29],"as":[30,84],"a":[31,78],"measure":[32,82],"understand":[34],"learning":[36],"dynamics":[37],"these":[39],"black-box":[40],"models.":[41],"However,":[42],"estimating":[43],"MI":[44,97],"in":[45,49,56,98],"high":[46,99],"dimensions":[47],"and":[48,126,135],"deterministic":[50],"settings":[51],"problematic,":[53],"often":[54],"resulting":[55],"widely":[57],"varying":[58],"estimates":[59],"for":[60],"different":[61],"estimators.":[62],"This":[63],"paper":[64],"takes":[65],"an":[66],"alternative":[67],"approach":[68],"analyze":[70],"behaviour":[72],"models":[75],"by":[76],"recently":[79],"known":[83],"sliced":[85],"(SMI),":[88],"which":[89],"more":[91],"computationally":[92],"efficient":[93],"estimate":[95],"than":[96],"dimensions.":[100],"We":[101,121],"theoretically":[102],"connect":[103],"SMI":[104,124,130],"classifier":[107],"margin,":[108],"thereby":[109],"showcasing":[110],"its":[111],"ability":[112,143],"encode":[114],"geometric":[115],"properties":[116],"feature":[119],"distribution.":[120],"also":[122],"study":[123],"empirically":[125],"demonstrate":[127],"that":[128],"between":[131],"hidden":[133],"layer":[134],"labels":[137,146],"encodes":[138],"about":[140],"network\u2019s":[142],"predict":[145],"correctly.":[147]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
