{"id":"https://openalex.org/W4380551263","doi":"https://doi.org/10.48550/arxiv.2306.06238","title":"Understanding the Effect of the Long Tail on Neural Network Compression","display_name":"Understanding the Effect of the Long Tail on Neural Network Compression","publication_year":2023,"publication_date":"2023-06-09","ids":{"openalex":"https://openalex.org/W4380551263","doi":"https://doi.org/10.48550/arxiv.2306.06238"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2306.06238","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.06238","pdf_url":"https://arxiv.org/pdf/2306.06238","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2306.06238","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058305816","display_name":"Harvey Dam","orcid":"https://orcid.org/0009-0005-9878-7642"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dam, Harvey","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015629734","display_name":"V. Roshan Joseph","orcid":"https://orcid.org/0000-0002-9430-5301"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Joseph, Vinu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014414126","display_name":"Aditya Bhaskara","orcid":"https://orcid.org/0000-0001-5505-3140"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhaskara, Aditya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025343365","display_name":"Ganesh Gopalakrishna","orcid":"https://orcid.org/0000-0001-5883-919X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gopalakrishnan, Ganesh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033185286","display_name":"Saurav Muralidharan","orcid":"https://orcid.org/0000-0003-4024-3958"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muralidharan, Saurav","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5024606205","display_name":"Michael Garland","orcid":"https://orcid.org/0000-0001-6093-7602"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Garland, Michael","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5058305816"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/memorization","display_name":"Memorization","score":0.771263599395752},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7429792284965515},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6452480554580688},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.631655752658844},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.615484893321991},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.5908589363098145},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5407495498657227},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.531548023223877},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.5176082849502563},{"id":"https://openalex.org/keywords/equivalence","display_name":"Equivalence (formal languages)","score":0.46042418479919434},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.44895613193511963},{"id":"https://openalex.org/keywords/image-compression","display_name":"Image compression","score":0.4287306070327759},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4246545433998108},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.21280965209007263},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.138264000415802},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.09689748287200928}],"concepts":[{"id":"https://openalex.org/C30038468","wikidata":"https://www.wikidata.org/wiki/Q4354775","display_name":"Memorization","level":2,"score":0.771263599395752},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7429792284965515},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6452480554580688},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.631655752658844},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.615484893321991},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.5908589363098145},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5407495498657227},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.531548023223877},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.5176082849502563},{"id":"https://openalex.org/C2780069185","wikidata":"https://www.wikidata.org/wiki/Q7977945","display_name":"Equivalence (formal languages)","level":2,"score":0.46042418479919434},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44895613193511963},{"id":"https://openalex.org/C13481523","wikidata":"https://www.wikidata.org/wiki/Q412438","display_name":"Image compression","level":4,"score":0.4287306070327759},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4246545433998108},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.21280965209007263},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.138264000415802},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.09689748287200928},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2306.06238","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.06238","pdf_url":"https://arxiv.org/pdf/2306.06238","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2306.06238","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2306.06238","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2306.06238","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.06238","pdf_url":"https://arxiv.org/pdf/2306.06238","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4380551263.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2129829718","https://openalex.org/W2521595930","https://openalex.org/W4243608781","https://openalex.org/W3165542721","https://openalex.org/W4313046148","https://openalex.org/W1939109514","https://openalex.org/W4378191574","https://openalex.org/W2161981399","https://openalex.org/W2612632602","https://openalex.org/W2595043295"],"abstract_inverted_index":{"Network":[0],"compression":[1,79,128,177],"is":[2,121],"now":[3],"a":[4,133],"mature":[5],"sub-field":[6],"of":[7,24,98,116,132],"neural":[8],"network":[9,78,134],"research:":[10],"over":[11],"the":[12,22,32,44,58,71,85,96,99,130,144,149,156],"last":[13],"decade,":[14],"significant":[15],"progress":[16],"has":[17,52],"been":[18,53],"made":[19],"towards":[20,66],"reducing":[21],"size":[23],"models":[25,62,153],"and":[26,60,151,176],"speeding":[27],"up":[28],"inference,":[29],"while":[30,80],"maintaining":[31,81],"classification":[33,169],"accuracy.":[34],"However,":[35],"many":[36],"works":[37],"have":[38],"observed":[39,107],"that":[40,55,114],"focusing":[41],"on":[42],"just":[43],"overall":[45],"accuracy":[46],"can":[47,63,75],"be":[48,64],"misguided.":[49],"E.g.,":[50],"it":[51],"shown":[54],"mismatches":[56,147],"between":[57,148],"full":[59,150],"compressed":[61,152],"biased":[65],"under-represented":[67],"classes.":[68],"This":[69],"raises":[70],"important":[72],"research":[73],"question,":[74],"we":[76,91,142],"achieve":[77],"\"semantic":[82],"equivalence\"":[83],"with":[84,155],"original":[86],"network?":[87],"In":[88],"this":[89,93,165],"work,":[90],"study":[92,143],"question":[94],"in":[95,103,164],"context":[97],"\"long":[100],"tail\"":[101],"phenomenon":[102],"computer":[104],"vision":[105],"datasets":[106],"by":[108,171],"Feldman,":[109],"et":[110],"al.":[111],"They":[112],"argue":[113],"memorization":[115],"certain":[117],"inputs":[118],"(appropriately":[119],"defined)":[120],"essential":[122],"to":[123,140],"achieving":[124],"good":[125],"generalization.":[126],"As":[127],"limits":[129],"capacity":[131],"(and":[135],"hence":[136],"also":[137],"its":[138],"ability":[139],"memorize),":[141],"question:":[145],"are":[146],"correlated":[154],"memorized":[157],"training":[158],"data?":[159],"We":[160],"present":[161],"positive":[162],"evidence":[163],"direction":[166],"for":[167],"image":[168],"tasks,":[170],"considering":[172],"different":[173],"base":[174],"architectures":[175],"schemes.":[178]},"counts_by_year":[],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
