{"id":"https://openalex.org/W3094216089","doi":"https://doi.org/10.1145/3340531.3412171","title":"Compression of Deep Learning Models for NLP","display_name":"Compression of Deep Learning Models for NLP","publication_year":2020,"publication_date":"2020-10-19","ids":{"openalex":"https://openalex.org/W3094216089","doi":"https://doi.org/10.1145/3340531.3412171","mag":"3094216089"},"language":"en","primary_location":{"id":"doi:10.1145/3340531.3412171","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3340531.3412171","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046755750","display_name":"Manish Gupta","orcid":"https://orcid.org/0000-0002-2843-3110"},"institutions":[{"id":"https://openalex.org/I4210162141","display_name":"Microsoft (India)","ror":"https://ror.org/04ww0w091","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210162141"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Manish Gupta","raw_affiliation_strings":["Microsoft, Hyderabad, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft, Hyderabad, India","institution_ids":["https://openalex.org/I4210162141"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073786634","display_name":"Vasudeva Varma","orcid":"https://orcid.org/0000-0003-1923-1725"},"institutions":[{"id":"https://openalex.org/I64189192","display_name":"International Institute of Information Technology, Hyderabad","ror":"https://ror.org/05f11g639","country_code":"IN","type":"education","lineage":["https://openalex.org/I64189192"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Vasudeva Varma","raw_affiliation_strings":["International Institute of Information Technology Hyderabad, Hyderabad, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"International Institute of Information Technology Hyderabad, Hyderabad, India","institution_ids":["https://openalex.org/I64189192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005355449","display_name":"Sonam Damani","orcid":null},"institutions":[{"id":"https://openalex.org/I4210162141","display_name":"Microsoft (India)","ror":"https://ror.org/04ww0w091","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210162141"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sonam Damani","raw_affiliation_strings":["Microsoft, Hyderabad, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft, Hyderabad, India","institution_ids":["https://openalex.org/I4210162141"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033118922","display_name":"Kedhar Nath Narahari","orcid":null},"institutions":[{"id":"https://openalex.org/I4210162141","display_name":"Microsoft (India)","ror":"https://ror.org/04ww0w091","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210162141"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Kedhar Nath Narahari","raw_affiliation_strings":["Microsoft, Hyderabad, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Microsoft, Hyderabad, India","institution_ids":["https://openalex.org/I4210162141"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.8125,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.79565529,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"3507","last_page":"3508"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9847000241279602,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8185878396034241},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6796788573265076},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6674247980117798},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.6567657589912415},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.5824214816093445},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.47039493918418884},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.4385085701942444},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08428353071212769},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.07954001426696777}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8185878396034241},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6796788573265076},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6674247980117798},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.6567657589912415},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.5824214816093445},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.47039493918418884},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.4385085701942444},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08428353071212769},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.07954001426696777},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3340531.3412171","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3340531.3412171","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6600000262260437,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W1821462560","https://openalex.org/W2084910356","https://openalex.org/W2119144962","https://openalex.org/W2134797427","https://openalex.org/W2312434537","https://openalex.org/W2460130460","https://openalex.org/W2512629640","https://openalex.org/W2626778328","https://openalex.org/W2653504903","https://openalex.org/W2764043458","https://openalex.org/W2767785892","https://openalex.org/W2769137120","https://openalex.org/W2786548044","https://openalex.org/W2787017828","https://openalex.org/W2787752464","https://openalex.org/W2866343820","https://openalex.org/W2904107554","https://openalex.org/W2914294010","https://openalex.org/W2915716523","https://openalex.org/W2919207648","https://openalex.org/W2924902521","https://openalex.org/W2937297214","https://openalex.org/W2940744433","https://openalex.org/W2945767825","https://openalex.org/W2950455323","https://openalex.org/W2952383053","https://openalex.org/W2952533036","https://openalex.org/W2963643655","https://openalex.org/W2963703075","https://openalex.org/W2963736842","https://openalex.org/W2963838731","https://openalex.org/W2963991999","https://openalex.org/W2964305088","https://openalex.org/W2969515962","https://openalex.org/W2970213198","https://openalex.org/W2970454332","https://openalex.org/W2971842688","https://openalex.org/W2976132230","https://openalex.org/W3001665736","https://openalex.org/W3103522166","https://openalex.org/W3104216863"],"related_works":["https://openalex.org/W96612179","https://openalex.org/W2566006169","https://openalex.org/W2770234245","https://openalex.org/W2987774938","https://openalex.org/W632915154","https://openalex.org/W4229499248","https://openalex.org/W4378874356","https://openalex.org/W2055733372","https://openalex.org/W2369811061","https://openalex.org/W4380075502"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"the":[3,88,100,125,132],"fields":[4],"of":[5,58,75,91,103],"NLP":[6,85],"and":[7,21,23,47,68,96,99,136],"information":[8],"retrieval":[9],"have":[10],"made":[11],"tremendous":[12],"progress":[13],"thanks":[14],"to":[15,78],"deep":[16],"learning":[17,127],"models":[18,26,31,77],"like":[19,27],"RNNs":[20],"LSTMs,":[22],"Transformer[35]":[24],"based":[25,71],"BERT[9].":[28],"But":[29],"these":[30],"are":[32],"humongous":[33],"in":[34,82,107,131],"size.":[35],"Real":[36],"world":[37],"applications":[38,93],"however":[39],"demand":[40],"small":[41,97],"model":[42],"size,":[43],"low":[44,48],"response":[45],"times":[46],"computational":[49],"power":[50],"wattage.":[51],"We":[52,118],"will":[53,119],"discuss":[54],"six":[55],"different":[56],"types":[57],"methods":[59],"(pruning,":[60],"quantization,":[61],"knowledge":[62],"distillation,":[63],"parameter":[64],"sharing,":[65],"matrix":[66],"decomposition,":[67],"other":[69],"Transformer":[70],"methods)":[72],"for":[73,128],"compression":[74],"such":[76],"enable":[79],"their":[80],"deployment":[81],"real":[83],"industry":[84],"projects.":[86],"Given":[87],"critical":[89],"need":[90],"building":[92],"with":[94],"efficient":[95],"models,":[98],"large":[101],"amount":[102],"recently":[104],"published":[105],"work":[106,122],"this":[108,113],"area,":[109],"we":[110],"believe":[111],"that":[112],"tutorial":[114],"is":[115],"very":[116],"timely.":[117],"organize":[120],"related":[121],"done":[123],"by":[124],"'deep":[126],"NLP'":[129],"community":[130],"past":[133],"few":[134],"years":[135],"present":[137],"it":[138],"as":[139],"a":[140],"coherent":[141],"story.":[142]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
