{"id":"https://openalex.org/W2005555645","doi":"https://doi.org/10.1109/asru.2011.6163935","title":"Randomized maximum entropy language models","display_name":"Randomized maximum entropy language models","publication_year":2011,"publication_date":"2011-12-01","ids":{"openalex":"https://openalex.org/W2005555645","doi":"https://doi.org/10.1109/asru.2011.6163935","mag":"2005555645"},"language":"en","primary_location":{"id":"doi:10.1109/asru.2011.6163935","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2011.6163935","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE Workshop on Automatic Speech Recognition &amp; Understanding","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113753678","display_name":"Puyang Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Puyang Xu","raw_affiliation_strings":["Department of Electrical & Computer Engineering, Center of Language and Speech Processing, Johns Hopkins University, Baltimore, MD, USA","Department of Electrical & Computer Engineering, Center of Language and Speech Processing, Johns Hopkins University, Baltimore, MD 21218, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical & Computer Engineering, Center of Language and Speech Processing, Johns Hopkins University, Baltimore, MD, USA","institution_ids":["https://openalex.org/I145311948"]},{"raw_affiliation_string":"Department of Electrical & Computer Engineering, Center of Language and Speech Processing, Johns Hopkins University, Baltimore, MD 21218, USA","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014580424","display_name":"Sanjeev Khudanpur","orcid":"https://orcid.org/0000-0001-5976-0897"},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sanjeev Khudanpur","raw_affiliation_strings":["Department of Electrical & Computer Engineering, Center of Language and Speech Processing, Johns Hopkins University, Baltimore, MD, USA","Department of Electrical & Computer Engineering, Center of Language and Speech Processing, Johns Hopkins University, Baltimore, MD 21218, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical & Computer Engineering, Center of Language and Speech Processing, Johns Hopkins University, Baltimore, MD, USA","institution_ids":["https://openalex.org/I145311948"]},{"raw_affiliation_string":"Department of Electrical & Computer Engineering, Center of Language and Speech Processing, Johns Hopkins University, Baltimore, MD 21218, USA","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067397403","display_name":"Asela Gunawardana","orcid":"https://orcid.org/0000-0003-3205-6589"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Asela Gunawardana","raw_affiliation_strings":["Microsoft Research, Redmond, WA, USA","[Microsoft Research, Redmond, WA 98052 USA.]"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"[Microsoft Research, Redmond, WA 98052 USA.]","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5113753678"],"corresponding_institution_ids":["https://openalex.org/I145311948"],"apc_list":null,"apc_paid":null,"fwci":1.3207,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.83751349,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"226","last_page":"230"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7558538913726807},{"id":"https://openalex.org/keywords/bloom-filter","display_name":"Bloom filter","score":0.7314944863319397},{"id":"https://openalex.org/keywords/hash-function","display_name":"Hash function","score":0.7197140455245972},{"id":"https://openalex.org/keywords/perplexity","display_name":"Perplexity","score":0.6471580266952515},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.5661119818687439},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.5037564635276794},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4938252866268158},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4568837285041809},{"id":"https://openalex.org/keywords/hash-table","display_name":"Hash table","score":0.4392147660255432},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3389558792114258},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.336297869682312},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2851596474647522}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7558538913726807},{"id":"https://openalex.org/C147224247","wikidata":"https://www.wikidata.org/wiki/Q885373","display_name":"Bloom filter","level":2,"score":0.7314944863319397},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.7197140455245972},{"id":"https://openalex.org/C100279451","wikidata":"https://www.wikidata.org/wiki/Q372193","display_name":"Perplexity","level":3,"score":0.6471580266952515},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.5661119818687439},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.5037564635276794},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4938252866268158},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4568837285041809},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.4392147660255432},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3389558792114258},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.336297869682312},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2851596474647522},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/asru.2011.6163935","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2011.6163935","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE Workshop on Automatic Speech Recognition &amp; Understanding","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.433.2679","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.433.2679","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.clsp.jhu.edu/~puyang/papers/rmelm_final.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W45102278","https://openalex.org/W87260881","https://openalex.org/W115367774","https://openalex.org/W162552777","https://openalex.org/W1605569224","https://openalex.org/W1797288984","https://openalex.org/W1996903695","https://openalex.org/W2017708149","https://openalex.org/W2070996757","https://openalex.org/W2091825929","https://openalex.org/W2098318492","https://openalex.org/W2109664771","https://openalex.org/W2111305191","https://openalex.org/W2114858359","https://openalex.org/W2122429665","https://openalex.org/W2123845384","https://openalex.org/W2130180273","https://openalex.org/W2143866356","https://openalex.org/W2155794909","https://openalex.org/W6601826859","https://openalex.org/W6603602746","https://openalex.org/W6604704417","https://openalex.org/W6606526954","https://openalex.org/W6636442488","https://openalex.org/W6638218882","https://openalex.org/W6676373471","https://openalex.org/W6678306947","https://openalex.org/W6682636730"],"related_works":["https://openalex.org/W2169518243","https://openalex.org/W2252095989","https://openalex.org/W4322096525","https://openalex.org/W2551914602","https://openalex.org/W4281893144","https://openalex.org/W4287323699","https://openalex.org/W2105076537","https://openalex.org/W2084531783","https://openalex.org/W2902731467","https://openalex.org/W2787311093"],"abstract_inverted_index":{"We":[0,52,64],"address":[1],"the":[2,32,43,55],"memory":[3],"problem":[4],"of":[5,58,73],"maximum":[6],"entropy":[7],"language":[8],"models":[9],"(MELM)":[10],"with":[11,60,66],"very":[12],"large":[13,100],"feature":[14,38,44],"sets.":[15],"Randomized":[16],"techniques":[17],"are":[18,90],"employed":[19],"to":[20,39,101],"remove":[21],"all":[22],"large,":[23],"exact":[24],"data":[25],"structures":[26],"in":[27],"MELM":[28,94],"implementations.":[29],"To":[30],"avoid":[31],"dictionary":[33],"structure":[34],"that":[35,69,95],"maps":[36],"each":[37],"its":[40],"corresponding":[41],"weight,":[42],"hashing":[45],"trick":[46],"[1]":[47],"[2]":[48],"can":[49],"be":[50,98],"used.":[51],"also":[53],"replace":[54],"explicit":[56],"storage":[57],"features":[59],"a":[61],"Bloom":[62,74],"filter.":[63],"show":[65],"extensive":[67],"experiments":[68],"false":[70],"positive":[71],"errors":[72],"filters":[75],"and":[76,87],"random":[77],"hash":[78],"collisions":[79],"do":[80],"not":[81],"degrade":[82],"model":[83],"performance.":[84],"Both":[85],"perplexity":[86],"WER":[88],"improvements":[89],"demonstrated":[91],"by":[92],"building":[93],"would":[96],"otherwise":[97],"prohibitively":[99],"estimate":[102],"or":[103],"store.":[104]},"counts_by_year":[{"year":2017,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
