{"id":"https://openalex.org/W2788402229","doi":"https://doi.org/10.1109/icassp.2018.8461608","title":"High Order Recurrent Neural Networks for Acoustic Modelling","display_name":"High Order Recurrent Neural Networks for Acoustic Modelling","publication_year":2018,"publication_date":"2018-04-01","ids":{"openalex":"https://openalex.org/W2788402229","doi":"https://doi.org/10.1109/icassp.2018.8461608","mag":"2788402229"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2018.8461608","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2018.8461608","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007989522","display_name":"C. Zhang","orcid":"https://orcid.org/0000-0002-2173-6872"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"C. Zhang","raw_affiliation_strings":["Cambridge University Engineering Dept, Cambridge, U.K"],"affiliations":[{"raw_affiliation_string":"Cambridge University Engineering Dept, Cambridge, U.K","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002191410","display_name":"Philip C. Woodland","orcid":"https://orcid.org/0000-0001-9069-0225"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"P. C. Woodland","raw_affiliation_strings":["Cambridge University Engineering Dept, Cambridge, U.K"],"affiliations":[{"raw_affiliation_string":"Cambridge University Engineering Dept, Cambridge, U.K","institution_ids":["https://openalex.org/I241749"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5007989522"],"corresponding_institution_ids":["https://openalex.org/I241749"],"apc_list":null,"apc_paid":null,"fwci":2.38274951,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.89176817,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"5849","last_page":"5853"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.9169220924377441},{"id":"https://openalex.org/keywords/sigmoid-function","display_name":"Sigmoid function","score":0.8290863037109375},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6844112873077393},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.66704261302948},{"id":"https://openalex.org/keywords/long-short-term-memory","display_name":"Long short term memory","score":0.6304678916931152},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.5615748167037964},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5437584519386292},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5101907253265381},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.4865245223045349},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4702647626399994},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4593603312969208},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.35957080125808716},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3300588130950928},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1941128671169281}],"concepts":[{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.9169220924377441},{"id":"https://openalex.org/C81388566","wikidata":"https://www.wikidata.org/wiki/Q526668","display_name":"Sigmoid function","level":3,"score":0.8290863037109375},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6844112873077393},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.66704261302948},{"id":"https://openalex.org/C133488467","wikidata":"https://www.wikidata.org/wiki/Q6673524","display_name":"Long short term memory","level":4,"score":0.6304678916931152},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.5615748167037964},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5437584519386292},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5101907253265381},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.4865245223045349},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4702647626399994},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4593603312969208},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.35957080125808716},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3300588130950928},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1941128671169281},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2018.8461608","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2018.8461608","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W196214544","https://openalex.org/W1517386993","https://openalex.org/W1815076433","https://openalex.org/W1924770834","https://openalex.org/W2027945811","https://openalex.org/W2032676284","https://openalex.org/W2036958054","https://openalex.org/W2064675550","https://openalex.org/W2070922095","https://openalex.org/W2097332485","https://openalex.org/W2103452139","https://openalex.org/W2107878631","https://openalex.org/W2129334286","https://openalex.org/W2131774270","https://openalex.org/W2145247325","https://openalex.org/W2194775991","https://openalex.org/W2288402171","https://openalex.org/W2293634267","https://openalex.org/W2345668077","https://openalex.org/W2401396087","https://openalex.org/W2407698769","https://openalex.org/W2510349098","https://openalex.org/W2564089970","https://openalex.org/W2682975603","https://openalex.org/W2734724284","https://openalex.org/W2746707458","https://openalex.org/W2935927048","https://openalex.org/W2953318193","https://openalex.org/W2962965465","https://openalex.org/W2963654251","https://openalex.org/W2963917928","https://openalex.org/W2964084166","https://openalex.org/W4254816979","https://openalex.org/W4294555862","https://openalex.org/W4300402905","https://openalex.org/W6607974698","https://openalex.org/W6638205174","https://openalex.org/W6638545294","https://openalex.org/W6640608466","https://openalex.org/W6679446661","https://openalex.org/W6687483927","https://openalex.org/W6696224498","https://openalex.org/W6696934422","https://openalex.org/W6713250295","https://openalex.org/W6713606482","https://openalex.org/W6725628136","https://openalex.org/W6730841103","https://openalex.org/W6739851064","https://openalex.org/W6748790474"],"related_works":["https://openalex.org/W2912153778","https://openalex.org/W4387163678","https://openalex.org/W4288108708","https://openalex.org/W2973430807","https://openalex.org/W4385280324","https://openalex.org/W2890685186","https://openalex.org/W2984436043","https://openalex.org/W4390245176","https://openalex.org/W2912831041","https://openalex.org/W3173606726"],"abstract_inverted_index":{"Vanishing":[0],"long-term":[1],"gradients":[2],"are":[3],"a":[4,63,119],"major":[5],"issue":[6],"in":[7],"training":[8],"standard":[9],"recurrent":[10,128],"neural":[11],"networks":[12],"(RNNs),":[13],"which":[14,68],"can":[15],"be":[16],"alleviated":[17],"by":[18,106],"long":[19],"short-term":[20],"memory":[21,25,34],"(LSTM)":[22],"models":[23],"with":[24,32,49],"cells.":[26],"However,":[27],"the":[28,33,50,58,89,111,127],"extra":[29],"parameters":[30,45,130],"associated":[31],"cells":[35],"mean":[36],"an":[37,47],"LSTM":[38,121],"layer":[39,129],"has":[40,69],"four":[41],"times":[42],"as":[43,46],"many":[44],"RNN":[48,66],"same":[51],"hidden":[52],"vector":[53],"size.":[54],"This":[55],"paper":[56],"addresses":[57],"vanishing":[59],"gradient":[60],"problem":[61],"using":[62,80,123],"high":[64],"order":[65],"(HORNN)":[67],"additional":[70],"connections":[71],"from":[72],"multiple":[73],"previous":[74],"time":[75],"steps.":[76],"Speech":[77],"recognition":[78],"experiments":[79],"British":[81],"English":[82],"multi-genre":[83],"broadcast":[84],"(MGB3)":[85],"data":[86],"showed":[87],"that":[88],"proposed":[90],"HORNN":[91],"architectures":[92],"for":[93],"rectified":[94],"linear":[95],"unit":[96],"and":[97,108,114,131],"sigmoid":[98],"activation":[99],"functions":[100],"reduced":[101],"word":[102],"error":[103],"rates":[104],"(WER)":[105],"4.2%":[107],"6.3%":[109],"over":[110],"corresponding":[112],"RNNs,":[113],"gave":[115],"similar":[116],"WERs":[117],"to":[118],"(projected)":[120],"while":[122],"only":[124],"20%-50%":[125],"of":[126],"computation.":[132]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
