{"id":"https://openalex.org/W2904535507","doi":"https://doi.org/10.1609/aaai.v33i01.33013280","title":"Towards Non-Saturating Recurrent Units for Modelling Long-Term Dependencies","display_name":"Towards Non-Saturating Recurrent Units for Modelling Long-Term Dependencies","publication_year":2019,"publication_date":"2019-07-17","ids":{"openalex":"https://openalex.org/W2904535507","doi":"https://doi.org/10.1609/aaai.v33i01.33013280","mag":"2904535507"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v33i01.33013280","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33013280","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4200/4078","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4200/4078","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104083090","display_name":"Sarath Chandar","orcid":null},"institutions":[{"id":"https://openalex.org/I70931966","display_name":"Universit\u00e9 de Montr\u00e9al","ror":"https://ror.org/0161xgx34","country_code":"CA","type":"education","lineage":["https://openalex.org/I70931966"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Sarath Chandar","raw_affiliation_strings":["University of Montreal"],"affiliations":[{"raw_affiliation_string":"University of Montreal","institution_ids":["https://openalex.org/I70931966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039984997","display_name":"Chinnadhurai Sankar","orcid":null},"institutions":[{"id":"https://openalex.org/I70931966","display_name":"Universit\u00e9 de Montr\u00e9al","ror":"https://ror.org/0161xgx34","country_code":"CA","type":"education","lineage":["https://openalex.org/I70931966"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Chinnadhurai Sankar","raw_affiliation_strings":["University of Montreal"],"affiliations":[{"raw_affiliation_string":"University of Montreal","institution_ids":["https://openalex.org/I70931966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008902493","display_name":"Eugene Vorontsov","orcid":"https://orcid.org/0000-0002-4530-533X"},"institutions":[{"id":"https://openalex.org/I45683168","display_name":"Polytechnique Montr\u00e9al","ror":"https://ror.org/05f8d4e86","country_code":"CA","type":"education","lineage":["https://openalex.org/I45683168"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Eugene Vorontsov","raw_affiliation_strings":["Polytechnique Montreal"],"affiliations":[{"raw_affiliation_string":"Polytechnique Montreal","institution_ids":["https://openalex.org/I45683168"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032466547","display_name":"Samira Ebrahimi Kahou","orcid":null},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Samira Ebrahimi Kahou","raw_affiliation_strings":["Microsoft"],"affiliations":[{"raw_affiliation_string":"Microsoft","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086198262","display_name":"Yoshua Bengio","orcid":"https://orcid.org/0000-0002-9322-3515"},"institutions":[{"id":"https://openalex.org/I70931966","display_name":"Universit\u00e9 de Montr\u00e9al","ror":"https://ror.org/0161xgx34","country_code":"CA","type":"education","lineage":["https://openalex.org/I70931966"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Yoshua Bengio","raw_affiliation_strings":["Universite de Montreal"],"affiliations":[{"raw_affiliation_string":"Universite de Montreal","institution_ids":["https://openalex.org/I70931966"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5104083090"],"corresponding_institution_ids":["https://openalex.org/I70931966"],"apc_list":null,"apc_paid":null,"fwci":3.09,"has_fulltext":true,"cited_by_count":49,"citation_normalized_percentile":{"value":0.93066202,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"33","issue":"01","first_page":"3280","last_page":"3287"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9879000186920166,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.7007434368133545},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.6360259652137756},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.601814329624176},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.5996559262275696},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.5384770035743713},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4488334357738495},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4228218197822571},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.37469929456710815},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3534153699874878},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.13399001955986023},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.1298370659351349}],"concepts":[{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.7007434368133545},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.6360259652137756},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.601814329624176},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.5996559262275696},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.5384770035743713},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4488334357738495},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4228218197822571},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.37469929456710815},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3534153699874878},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.13399001955986023},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.1298370659351349},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1609/aaai.v33i01.33013280","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33013280","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4200/4078","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:publications.polymtl.ca:46832","is_oa":false,"landing_page_url":"https://publications.polymtl.ca/46832/","pdf_url":null,"source":{"id":"https://openalex.org/S4306401013","display_name":"PolyPublie (\u00c9cole Polytechnique de Montr\u00e9al)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45683168","host_organization_name":"Polytechnique Montr\u00e9al","host_organization_lineage":["https://openalex.org/I45683168"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article de revue"}],"best_oa_location":{"id":"doi:10.1609/aaai.v33i01.33013280","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33013280","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4200/4078","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6600000262260437,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2904535507.pdf","grobid_xml":"https://content.openalex.org/works/W2904535507.grobid-xml"},"referenced_works_count":51,"referenced_works":["https://openalex.org/W194249466","https://openalex.org/W581956982","https://openalex.org/W1522301498","https://openalex.org/W1591706642","https://openalex.org/W1632114991","https://openalex.org/W1665214252","https://openalex.org/W1800356822","https://openalex.org/W1815076433","https://openalex.org/W1836465849","https://openalex.org/W1921523184","https://openalex.org/W1924770834","https://openalex.org/W2107878631","https://openalex.org/W2116261113","https://openalex.org/W2119717200","https://openalex.org/W2130942839","https://openalex.org/W2157331557","https://openalex.org/W2163605009","https://openalex.org/W2175402905","https://openalex.org/W2260756217","https://openalex.org/W2474920236","https://openalex.org/W2530887700","https://openalex.org/W2547718140","https://openalex.org/W2547875792","https://openalex.org/W2548228487","https://openalex.org/W2581719241","https://openalex.org/W2587753047","https://openalex.org/W2618530766","https://openalex.org/W2743945814","https://openalex.org/W2751304263","https://openalex.org/W2797349519","https://openalex.org/W2939265332","https://openalex.org/W2951605425","https://openalex.org/W2963627187","https://openalex.org/W2963703360","https://openalex.org/W2964043796","https://openalex.org/W4230563027","https://openalex.org/W4294521337","https://openalex.org/W4295373206","https://openalex.org/W4297827933","https://openalex.org/W4299838440","https://openalex.org/W4302375066","https://openalex.org/W4303633609","https://openalex.org/W6631190155","https://openalex.org/W6635590879","https://openalex.org/W6666761814","https://openalex.org/W6677408996","https://openalex.org/W6679436768","https://openalex.org/W6685537299","https://openalex.org/W6701650085","https://openalex.org/W6734848962","https://openalex.org/W6745491427"],"related_works":["https://openalex.org/W4225394202","https://openalex.org/W4298287631","https://openalex.org/W2953061907","https://openalex.org/W3032952384","https://openalex.org/W3034302643","https://openalex.org/W1847088711","https://openalex.org/W3036642985","https://openalex.org/W2964335273","https://openalex.org/W1889624880","https://openalex.org/W2229372569"],"abstract_inverted_index":{"Modelling":[0],"long-term":[1,120],"dependencies":[2],"is":[3,11,103],"a":[4,53,58,69,89,125],"challenge":[5],"for":[6],"recurrent":[7,60],"neural":[8],"networks.":[9],"This":[10],"primarily":[12],"due":[13],"to":[14,83],"the":[15,23,100,104,110],"fact":[16],"that":[17,66,99,107],"gradients":[18],"vanish":[19],"during":[20],"training,":[21],"as":[22],"sequence":[24],"length":[25],"increases.":[26],"Gradients":[27],"can":[28],"be":[29],"attenuated":[30,36],"by":[31,39,49],"transition":[32],"operators":[33],"and":[34,78,93,118],"are":[35],"or":[37],"dropped":[38],"activation":[40,76],"functions.":[41],"Canonical":[42],"architectures":[43],"like":[44],"LSTM":[45],"alleviate":[46,85],"this":[47],"issue":[48],"skipping":[50],"information":[51],"through":[52],"memory":[54,70],"mechanism.":[55],"We":[56],"propose":[57],"new":[59],"architecture":[61],"(Non-saturating":[62],"Recurrent":[63],"Unit;":[64],"NRU)":[65],"relies":[67],"on":[68],"mechanism":[71],"but":[72],"forgoes":[73],"both":[74],"saturating":[75,79],"functions":[77],"gates,":[80],"in":[81],"order":[82],"further":[84],"vanishing":[86],"gradients.":[87],"In":[88],"series":[90],"of":[91,127],"synthetic":[92],"real":[94],"world":[95],"tasks,":[96],"we":[97],"demonstrate":[98],"proposed":[101],"model":[102,106],"only":[105],"performs":[108],"among":[109],"top":[111],"2":[112],"models":[113],"across":[114],"all":[115],"tasks":[116],"with":[117],"without":[119],"dependencies,":[121],"when":[122],"compared":[123],"against":[124],"range":[126],"other":[128],"architectures.":[129]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":3}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
