{"id":"https://openalex.org/W7139914734","doi":"https://doi.org/10.1016/j.procs.2026.01.068","title":"Hierarchical Recurrent Neural Networks with Bayesian Dropout for Long-Sequence Language Modeling Tasks","display_name":"Hierarchical Recurrent Neural Networks with Bayesian Dropout for Long-Sequence Language Modeling Tasks","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7139914734","doi":"https://doi.org/10.1016/j.procs.2026.01.068"},"language":"en","primary_location":{"id":"doi:10.1016/j.procs.2026.01.068","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.068","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1016/j.procs.2026.01.068","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066371991","display_name":"Khaled Abuhmaidan","orcid":"https://orcid.org/0000-0003-2346-6201"},"institutions":[{"id":"https://openalex.org/I45998257","display_name":"Sohar University","ror":"https://ror.org/02ftvf862","country_code":"OM","type":"education","lineage":["https://openalex.org/I45998257"]}],"countries":["OM"],"is_corresponding":false,"raw_author_name":"Khaled Abuhmaidan","raw_affiliation_strings":["Faculty of computing and IT, Sohar University, Oman"],"affiliations":[{"raw_affiliation_string":"Faculty of computing and IT, Sohar University, Oman","institution_ids":["https://openalex.org/I45998257"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037528486","display_name":"Taher M. Ghazal","orcid":"https://orcid.org/0000-0003-0672-7924"},"institutions":[{"id":"https://openalex.org/I885383172","display_name":"National University of Malaysia","ror":"https://ror.org/00bw8d226","country_code":"MY","type":"education","lineage":["https://openalex.org/I885383172"]}],"countries":["MY"],"is_corresponding":true,"raw_author_name":"Taher M. Ghazal","raw_affiliation_strings":["Faculty of Computing and IT, Sohar University, Oman, Department of Networks and Cybersecurity, Hourani Center for Applied Scientific Research, Al-Ahliyya Amman University, Amman, Jordan. Center for Cyber Security, Faculty of Information Science and Technology, Universiti Kebangsaan Malaysia (UKM), 43600 Bangi, Selangor, Malaysia"],"affiliations":[{"raw_affiliation_string":"Faculty of Computing and IT, Sohar University, Oman, Department of Networks and Cybersecurity, Hourani Center for Applied Scientific Research, Al-Ahliyya Amman University, Amman, Jordan. Center for Cyber Security, Faculty of Information Science and Technology, Universiti Kebangsaan Malaysia (UKM), 43600 Bangi, Selangor, Malaysia","institution_ids":["https://openalex.org/I885383172"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5037528486"],"corresponding_institution_ids":["https://openalex.org/I885383172"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.92994441,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":"275","issue":null,"first_page":"584","last_page":"593"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3677999973297119,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3677999973297119,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.11029999703168869,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.06129999831318855,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.8313000202178955},{"id":"https://openalex.org/keywords/dropout","display_name":"Dropout (neural networks)","score":0.7595999836921692},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5620999932289124},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.4912000000476837},{"id":"https://openalex.org/keywords/bayesian-network","display_name":"Bayesian network","score":0.4675000011920929},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3869999945163727}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.923799991607666},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.8313000202178955},{"id":"https://openalex.org/C2776145597","wikidata":"https://www.wikidata.org/wiki/Q25339462","display_name":"Dropout (neural networks)","level":2,"score":0.7595999836921692},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6625999808311462},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5620999932289124},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5382000207901001},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.4912000000476837},{"id":"https://openalex.org/C33724603","wikidata":"https://www.wikidata.org/wiki/Q812540","display_name":"Bayesian network","level":2,"score":0.4675000011920929},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3869999945163727},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3456000089645386},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.3393000066280365},{"id":"https://openalex.org/C144986985","wikidata":"https://www.wikidata.org/wiki/Q871236","display_name":"Hierarchical database model","level":2,"score":0.336899995803833},{"id":"https://openalex.org/C82142266","wikidata":"https://www.wikidata.org/wiki/Q3456604","display_name":"Dynamic Bayesian network","level":3,"score":0.31049999594688416},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.27649998664855957},{"id":"https://openalex.org/C71983512","wikidata":"https://www.wikidata.org/wiki/Q7915687","display_name":"Variable-order Bayesian network","level":4,"score":0.2689000070095062},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2590000033378601},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.258899986743927}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.procs.2026.01.068","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.068","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.procs.2026.01.068","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.068","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5187859535217285,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W4296990089","https://openalex.org/W4297105455","https://openalex.org/W4377103821","https://openalex.org/W4384404790","https://openalex.org/W4390188880","https://openalex.org/W4391012104","https://openalex.org/W4391718339","https://openalex.org/W4398225275","https://openalex.org/W4400053775","https://openalex.org/W4401243645","https://openalex.org/W4401580665","https://openalex.org/W4402568227","https://openalex.org/W4403246534","https://openalex.org/W4403299787","https://openalex.org/W4403799627","https://openalex.org/W4404201390","https://openalex.org/W4406177305","https://openalex.org/W4406219481","https://openalex.org/W4406242189","https://openalex.org/W4407030003","https://openalex.org/W4407466527","https://openalex.org/W4407595200","https://openalex.org/W4407935339","https://openalex.org/W4408477302","https://openalex.org/W4408695113","https://openalex.org/W4408697418","https://openalex.org/W4408729471","https://openalex.org/W4408788024","https://openalex.org/W4409014333","https://openalex.org/W4409347060","https://openalex.org/W4409426354","https://openalex.org/W4409510989","https://openalex.org/W4409831904","https://openalex.org/W4410049551","https://openalex.org/W4410083667","https://openalex.org/W4414085369"],"related_works":[],"abstract_inverted_index":{"Statistical":[0],"and":[1,29,67,94,138,147,195],"neural":[2],"language":[3,49,186],"models":[4],"continue":[5],"to":[6,19,91,101,111],"struggle":[7],"with":[8,42,125,132,154,174],"modeling":[9,50,162],"long-sequence":[10,48,185],"dependencies":[11],"in":[12,22,141,184],"natural":[13],"language.":[14],"This":[15,32,188],"is":[16,84],"primarily":[17],"due":[18],"challenges":[20],"inherent":[21],"recurrent":[23,56,106],"architectures,":[24],"including":[25],"vanishing":[26],"gradients,":[27],"overfitting,":[28],"limited":[30,117],"generalization.":[31],"work":[33],"presents":[34],"a":[35,87],"Hierarchical":[36],"Recurrent":[37],"Neural":[38],"Network":[39],"framework":[40],"enhanced":[41],"Bayesian":[43,82,133,175],"dropout":[44,83,134],"(HRNN-BD)":[45],"for":[46,160],"resilient":[47],"applications.":[51],"The":[52,61,166],"proposed":[53],"architecture":[54],"arranges":[55],"layers":[57,63,73],"into":[58],"hierarchical":[59,151,171],"levels.":[60],"lower":[62],"capture":[64],"short-term":[65],"lexical":[66],"grammatical":[68],"relationships,":[69],"while":[70,157],"the":[71,99,130,150,179,182],"higher":[72],"encode":[74],"longer,":[75],"contextual":[76],"patterns":[77],"that":[78,129,169],"span":[79],"longer":[80],"sequences.":[81],"employed":[85],"as":[86],"principled":[88],"regularization":[89,176],"method":[90],"address":[92],"overfitting":[93],"uncertainty":[95],"estimation.":[96],"It":[97],"enables":[98],"model":[100],"approximate":[102],"posterior":[103],"distributions":[104],"over":[105],"weights,":[107],"improving":[108],"its":[109],"ability":[110],"generalize":[112],"when":[113],"training":[114],"data":[115],"are":[116],"or":[118],"noisy.":[119],"Evaluations":[120],"performed":[121],"on":[122],"benchmark":[123],"datasets":[124],"long-text":[126],"corpora":[127],"demonstrate":[128],"HRNN":[131],"outperforms":[135],"traditional":[136],"LSTM":[137],"GRU":[139],"baselines":[140],"terms":[142],"of":[143,163,181],"perplexity,":[144],"sequence":[145],"coherence,":[146],"robustness.":[148],"Furthermore,":[149],"design":[152],"assists":[153],"memory":[155],"constraints":[156],"still":[158],"allowing":[159],"efficient":[161],"vast":[164],"entities.":[165],"results":[167],"show":[168],"combining":[170],"temporal":[172],"abstraction":[173],"can":[177,190],"enhance":[178],"state":[180],"art":[183],"modeling.":[187],"approach":[189],"support":[191],"document":[192],"generation,":[193],"summarization,":[194],"automated":[196],"translation.":[197]},"counts_by_year":[],"updated_date":"2026-03-22T06:25:25.174409","created_date":"2026-03-21T00:00:00"}
