{"id":"https://openalex.org/W2510403588","doi":"https://doi.org/10.18653/v1/p16-1022","title":"Compressing Neural Language Models by Sparse Word Representations","display_name":"Compressing Neural Language Models by Sparse Word Representations","publication_year":2016,"publication_date":"2016-01-01","ids":{"openalex":"https://openalex.org/W2510403588","doi":"https://doi.org/10.18653/v1/p16-1022","mag":"2510403588"},"language":"en","primary_location":{"id":"doi:10.18653/v1/p16-1022","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p16-1022","pdf_url":"https://www.aclweb.org/anthology/P16-1022.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/P16-1022.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049517695","display_name":"Yunchuan Chen","orcid":"https://orcid.org/0000-0002-7671-6350"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunchuan Chen","raw_affiliation_strings":["Key Laboratory of High Confidence Software Technologies (Peking University), MoE, China","University of Chinese Academy of Sciences,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies (Peking University), MoE, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences,","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024821632","display_name":"Lili Mou","orcid":"https://orcid.org/0000-0001-7753-4295"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lili Mou","raw_affiliation_strings":["Institute of Software, Peking University,","Key Laboratory of High Confidence Software Technologies (Peking University), MoE, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Software, Peking University,","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I20231570"]},{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies (Peking University), MoE, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100378208","display_name":"Yan Xu","orcid":"https://orcid.org/0000-0002-0271-044X"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yan Xu","raw_affiliation_strings":["Institute of Software, Peking University,","Key Laboratory of High Confidence Software Technologies (Peking University), MoE, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Software, Peking University,","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I20231570"]},{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies (Peking University), MoE, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100447691","display_name":"Ge Li","orcid":"https://orcid.org/0000-0003-0140-0949"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ge Li","raw_affiliation_strings":["Institute of Software, Peking University,","Key Laboratory of High Confidence Software Technologies (Peking University), MoE, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Software, Peking University,","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I20231570"]},{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies (Peking University), MoE, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049100391","display_name":"Zhi Jin","orcid":"https://orcid.org/0000-0003-1087-226X"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhi Jin","raw_affiliation_strings":["Institute of Software, Peking University,","Key Laboratory of High Confidence Software Technologies (Peking University), MoE, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Software, Peking University,","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I20231570"]},{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies (Peking University), MoE, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.0912,"has_fulltext":true,"cited_by_count":18,"citation_normalized_percentile":{"value":0.93031257,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/perplexity","display_name":"Perplexity","score":0.9156615734100342},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7889516353607178},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.7580975890159607},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.6744823455810547},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.6305767297744751},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5936009883880615},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5610872507095337},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.5293166041374207},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5291234254837036},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4879254996776581},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.4421907067298889},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3908958435058594},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14632651209831238}],"concepts":[{"id":"https://openalex.org/C100279451","wikidata":"https://www.wikidata.org/wiki/Q372193","display_name":"Perplexity","level":3,"score":0.9156615734100342},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7889516353607178},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.7580975890159607},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.6744823455810547},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.6305767297744751},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5936009883880615},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5610872507095337},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.5293166041374207},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5291234254837036},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4879254996776581},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.4421907067298889},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3908958435058594},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14632651209831238},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/p16-1022","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p16-1022","pdf_url":"https://www.aclweb.org/anthology/P16-1022.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/p16-1022","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p16-1022","pdf_url":"https://www.aclweb.org/anthology/P16-1022.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.800000011920929,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G1828425977","display_name":null,"funder_award_id":"973 Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2039607704","display_name":null,"funder_award_id":"2015CB352201","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G4512837029","display_name":"\u4e92\u8054\u7f51\u73af\u5883\u4e0b\u57fa\u4e8e\u77e5\u4ef6\u7684\u9700\u6c42\u9a71\u52a8\u77e5\u8bc6\u670d\u52a1\u7406\u8bba\u548c\u6280\u672f\u7814\u7a76","funder_award_id":"61232015","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4722731998","display_name":null,"funder_award_id":"91318301","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5152043508","display_name":null,"funder_award_id":"61421091","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2510403588.pdf","grobid_xml":"https://content.openalex.org/works/W2510403588.grobid-xml"},"referenced_works_count":39,"referenced_works":["https://openalex.org/W36903255","https://openalex.org/W179875071","https://openalex.org/W182831726","https://openalex.org/W591148856","https://openalex.org/W1512874001","https://openalex.org/W1518951372","https://openalex.org/W1522301498","https://openalex.org/W1558797106","https://openalex.org/W1614298861","https://openalex.org/W1631260214","https://openalex.org/W1724438581","https://openalex.org/W1821462560","https://openalex.org/W1841959837","https://openalex.org/W1843891098","https://openalex.org/W1951216520","https://openalex.org/W1965154800","https://openalex.org/W1985258458","https://openalex.org/W1996901117","https://openalex.org/W2085400714","https://openalex.org/W2091812280","https://openalex.org/W2100664567","https://openalex.org/W2113606819","https://openalex.org/W2120861206","https://openalex.org/W2138204974","https://openalex.org/W2140610559","https://openalex.org/W2250189634","https://openalex.org/W2251682575","https://openalex.org/W2294370754","https://openalex.org/W2295800168","https://openalex.org/W2340329281","https://openalex.org/W2384495648","https://openalex.org/W2950577311","https://openalex.org/W2950797609","https://openalex.org/W2952822287","https://openalex.org/W2962965405","https://openalex.org/W2963932686","https://openalex.org/W2964121744","https://openalex.org/W2998704965","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W2169518243","https://openalex.org/W2252095989","https://openalex.org/W4322096525","https://openalex.org/W2551914602","https://openalex.org/W4281893144","https://openalex.org/W2105076537","https://openalex.org/W2787311093","https://openalex.org/W2084531783","https://openalex.org/W2020757772","https://openalex.org/W2402231715"],"abstract_inverted_index":{"Neural":[0],"networks":[1],"are":[2,46],"among":[3],"the":[4,27,38,41,51,60,78,80,91,94,107,117,122],"state-ofthe-art":[5],"techniques":[6],"for":[7,56],"language":[8,12,71],"modeling.":[9],"Existing":[10],"neural":[11,70],"models":[13,72],"typically":[14],"map":[15],"discrete":[16],"words":[17,30],"to":[18,68,110],"distributed,":[19],"dense":[20],"vector":[21],"representations.":[22,76],"After":[23],"information":[24],"processing":[25],"of":[26,40,50,54,82,93,121],"preceding":[28],"context":[29],"by":[31,73],"hidden":[32],"layers,":[33],"an":[34],"output":[35,61],"layer":[36],"estimates":[37],"probability":[39],"next":[42],"word.":[43],"Such":[44],"approaches":[45],"time-and":[47],"memory-intensive":[48],"because":[49],"large":[52,112],"numbers":[53],"parameters":[55,83],"word":[57,75],"embeddings":[58],"and":[59],"layer.":[62],"In":[63,77],"this":[64],"paper,":[65],"we":[66],"propose":[67],"compress":[69],"sparse":[74],"experiments,":[79],"number":[81],"in":[84,119],"our":[85,102],"model":[86],"increases":[87],"very":[88],"slowly":[89],"with":[90],"growth":[92],"vocabulary":[95],"size,":[96],"which":[97],"is":[98],"almost":[99],"imperceptible.":[100],"Moreover,":[101],"approach":[103],"not":[104],"only":[105],"reduces":[106],"parameter":[108],"space":[109],"a":[111],"extent,":[113],"but":[114],"also":[115],"improves":[116],"performance":[118],"terms":[120],"perplexity":[123],"measure.":[124],"1":[125]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":2}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
