{"id":"https://openalex.org/W2787237356","doi":"https://doi.org/10.18653/v1/p18-2116","title":"Long Short-Term Memory as a Dynamically Computed Element-wise Weighted Sum","display_name":"Long Short-Term Memory as a Dynamically Computed Element-wise Weighted Sum","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2787237356","doi":"https://doi.org/10.18653/v1/p18-2116","mag":"2787237356"},"language":"en","primary_location":{"id":"doi:10.18653/v1/p18-2116","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-2116","pdf_url":"https://www.aclweb.org/anthology/P18-2116.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/P18-2116.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024311574","display_name":"Omer Levy","orcid":"https://orcid.org/0000-0001-7300-8191"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]},{"id":"https://openalex.org/I58610484","display_name":"Seattle University","ror":"https://ror.org/02jqc0m91","country_code":"US","type":"education","lineage":["https://openalex.org/I58610484"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Omer Levy","raw_affiliation_strings":["School, University of Washington, Seattle, WA","University of Washington, Seattle, United States"],"affiliations":[{"raw_affiliation_string":"School, University of Washington, Seattle, WA","institution_ids":["https://openalex.org/I201448701"]},{"raw_affiliation_string":"University of Washington, Seattle, United States","institution_ids":["https://openalex.org/I58610484","https://openalex.org/I201448701"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081862885","display_name":"Kenton Lee","orcid":"https://orcid.org/0000-0002-9534-5970"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]},{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kenton Lee","raw_affiliation_strings":["School, University of Washington, Seattle, WA","Google (United States), Mountain View, United States"],"affiliations":[{"raw_affiliation_string":"School, University of Washington, Seattle, WA","institution_ids":["https://openalex.org/I201448701"]},{"raw_affiliation_string":"Google (United States), Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073439637","display_name":"Nicholas FitzGerald","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nicholas FitzGerald","raw_affiliation_strings":["School, University of Washington, Seattle, WA","Google (United States), Mountain View, United States"],"affiliations":[{"raw_affiliation_string":"School, University of Washington, Seattle, WA","institution_ids":["https://openalex.org/I201448701"]},{"raw_affiliation_string":"Google (United States), Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067919401","display_name":"Luke Zettlemoyer","orcid":"https://orcid.org/0009-0008-8296-0764"},"institutions":[{"id":"https://openalex.org/I58610484","display_name":"Seattle University","ror":"https://ror.org/02jqc0m91","country_code":"US","type":"education","lineage":["https://openalex.org/I58610484"]},{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Luke Zettlemoyer","raw_affiliation_strings":["School, University of Washington, Seattle, WA","University of Washington, Seattle, United States"],"affiliations":[{"raw_affiliation_string":"School, University of Washington, Seattle, WA","institution_ids":["https://openalex.org/I201448701"]},{"raw_affiliation_string":"University of Washington, Seattle, United States","institution_ids":["https://openalex.org/I58610484","https://openalex.org/I201448701"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5024311574"],"corresponding_institution_ids":["https://openalex.org/I201448701","https://openalex.org/I58610484"],"apc_list":null,"apc_paid":null,"fwci":2.2001,"has_fulltext":true,"cited_by_count":14,"citation_normalized_percentile":{"value":0.90357529,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"732","last_page":"739"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decoupling","display_name":"Decoupling (probability)","score":0.8640694618225098},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7131778597831726},{"id":"https://openalex.org/keywords/long-short-term-memory","display_name":"Long short term memory","score":0.6709926128387451},{"id":"https://openalex.org/keywords/element","display_name":"Element (criminal law)","score":0.6265368461608887},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.6137229800224304},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.5593229532241821},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5070674419403076},{"id":"https://openalex.org/keywords/gating","display_name":"Gating","score":0.4992237091064453},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4913753569126129},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.4383242428302765},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4276989996433258},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4130893349647522},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3412031829357147},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.16654255986213684},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.06614643335342407}],"concepts":[{"id":"https://openalex.org/C205606062","wikidata":"https://www.wikidata.org/wiki/Q5249645","display_name":"Decoupling (probability)","level":2,"score":0.8640694618225098},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7131778597831726},{"id":"https://openalex.org/C133488467","wikidata":"https://www.wikidata.org/wiki/Q6673524","display_name":"Long short term memory","level":4,"score":0.6709926128387451},{"id":"https://openalex.org/C200288055","wikidata":"https://www.wikidata.org/wiki/Q2621792","display_name":"Element (criminal law)","level":2,"score":0.6265368461608887},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.6137229800224304},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.5593229532241821},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5070674419403076},{"id":"https://openalex.org/C194544171","wikidata":"https://www.wikidata.org/wiki/Q21105679","display_name":"Gating","level":2,"score":0.4992237091064453},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4913753569126129},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.4383242428302765},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4276989996433258},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4130893349647522},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3412031829357147},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.16654255986213684},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.06614643335342407},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.18653/v1/p18-2116","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-2116","pdf_url":"https://www.aclweb.org/anthology/P18-2116.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1805.03716","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1805.03716","pdf_url":"https://arxiv.org/pdf/1805.03716","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2787237356","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1805.03716.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1805.03716","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1805.03716","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.18653/v1/p18-2116","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-2116","pdf_url":"https://www.aclweb.org/anthology/P18-2116.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1746478","display_name":null,"funder_award_id":"FA8750-13-2-0019","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G290391106","display_name":null,"funder_award_id":"FA8750-13-2-001","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G3366966419","display_name":null,"funder_award_id":"W911NF-16-1","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"},{"id":"https://openalex.org/G4713059963","display_name":null,"funder_award_id":"FA8750","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G5524522455","display_name":null,"funder_award_id":"DARPA","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"},{"id":"https://openalex.org/G6497436218","display_name":"CAREER: Learning Scalable Models for Grounded Semantic Parsing","funder_award_id":"1252835","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G657448715","display_name":null,"funder_award_id":"W911NF-16-1-","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"},{"id":"https://openalex.org/G7452299184","display_name":null,"funder_award_id":"W911NF","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"},{"id":"https://openalex.org/G7750423253","display_name":null,"funder_award_id":"IIS-1562364","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8533175095","display_name":"RI: Medium: Broad-Coverage Semantic Parsing: Linguistic Representation Learning from Crowd-Scale Data","funder_award_id":"1562364","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8998121839","display_name":null,"funder_award_id":"911NF","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"},{"id":"https://openalex.org/F4320316083","display_name":"Tencent","ror":"https://ror.org/00hhjss72"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320338281","display_name":"Army Research Office","ror":"https://ror.org/05epdh915"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2787237356.pdf","grobid_xml":"https://content.openalex.org/works/W2787237356.grobid-xml"},"referenced_works_count":18,"referenced_works":["https://openalex.org/W194249466","https://openalex.org/W581956982","https://openalex.org/W1591801644","https://openalex.org/W1632114991","https://openalex.org/W1689711448","https://openalex.org/W2110485445","https://openalex.org/W2250263931","https://openalex.org/W2267186426","https://openalex.org/W2427527485","https://openalex.org/W2515741950","https://openalex.org/W2618101654","https://openalex.org/W2626778328","https://openalex.org/W2740765036","https://openalex.org/W2890177507","https://openalex.org/W2950297649","https://openalex.org/W2952436057","https://openalex.org/W2963212250","https://openalex.org/W2964308564"],"related_works":["https://openalex.org/W2963410683","https://openalex.org/W2064675550","https://openalex.org/W2947629814","https://openalex.org/W3033597970","https://openalex.org/W2740137140","https://openalex.org/W2969672740","https://openalex.org/W2970418991","https://openalex.org/W1980324747","https://openalex.org/W3135038743","https://openalex.org/W2964202535","https://openalex.org/W2989958114","https://openalex.org/W2949821897","https://openalex.org/W2752658941","https://openalex.org/W3132271517","https://openalex.org/W2030990735","https://openalex.org/W2950016430","https://openalex.org/W2970954235","https://openalex.org/W2069143585","https://openalex.org/W2951375073","https://openalex.org/W2790155499"],"abstract_inverted_index":{"LSTMs":[0],"were":[1],"introduced":[2],"to":[3,23],"combat":[4],"vanishing":[5,112],"gradients":[6],"in":[7,95,107],"simple":[8,55],"RNNs":[9,62],"by":[10,47],"augmenting":[11],"them":[12],"with":[13],"gated":[14],"additive":[15],"recurrent":[16,34],"connections.":[17],"We":[18,44],"present":[19],"an":[20,67,93],"alternative":[21],"view":[22],"explain":[24],"the":[25,29,49,53,64,75,85,101],"success":[26],"of":[27,61,71,74,81],"LSTMs:":[28],"gates":[30,51,102],"themselves":[31],"are":[32,103],"versatile":[33],"models":[35],"that":[36,84,100],"provide":[37],"more":[38,106],"representational":[39],"power":[40],"than":[41,109],"previously":[42],"appreciated.":[43],"do":[45],"this":[46],"decoupling":[48],"LSTM's":[50],"from":[52],"embedded":[54],"RNN,":[56],"producing":[57],"a":[58,79],"new":[59],"class":[60],"where":[63],"recurrence":[65],"computes":[66],"element-wise":[68],"weighted":[69],"sum":[70],"context-independent":[72],"functions":[73],"input.":[76],"Ablations":[77],"on":[78],"range":[80],"problems":[82],"demonstrate":[83],"gating":[86],"mechanism":[87],"alone":[88],"performs":[89],"as":[90,92],"well":[91],"LSTM":[94],"most":[96],"settings,":[97],"strongly":[98],"suggesting":[99],"doing":[104],"much":[105],"practice":[108],"just":[110],"alleviating":[111],"gradients.":[113]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":3}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
