{"id":"https://openalex.org/W4416286296","doi":"https://doi.org/10.1109/jiot.2025.3633765","title":"EIRM-RL: Epistemic Integrity Risk Monitoring Inspired Safe Reinforcement Learning for Trustworthy Autonomous Navigation","display_name":"EIRM-RL: Epistemic Integrity Risk Monitoring Inspired Safe Reinforcement Learning for Trustworthy Autonomous Navigation","publication_year":2025,"publication_date":"2025-11-17","ids":{"openalex":"https://openalex.org/W4416286296","doi":"https://doi.org/10.1109/jiot.2025.3633765"},"language":"en","primary_location":{"id":"doi:10.1109/jiot.2025.3633765","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2025.3633765","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100320703","display_name":"Yuanyuan Zhang","orcid":"https://orcid.org/0009-0003-6451-4633"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Yuanyuan Zhang","raw_affiliation_strings":["Department of Aeronautical and Aviation Engineering and the Research Centre for Unmanned Autonomous System, The Hong Kong Polytechnic University, Hong Kong, SAR, China","Department of Aeronautical and Aviation Engineering, Hong Kong Polytechnic University, Hong Kong, SAR, China"],"affiliations":[{"raw_affiliation_string":"Department of Aeronautical and Aviation Engineering and the Research Centre for Unmanned Autonomous System, The Hong Kong Polytechnic University, Hong Kong, SAR, China","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Department of Aeronautical and Aviation Engineering, Hong Kong Polytechnic University, Hong Kong, SAR, China","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101479917","display_name":"Yingying Wang","orcid":"https://orcid.org/0000-0003-3293-0790"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Yingying Wang","raw_affiliation_strings":["Department of Aeronautical and Aviation Engineering and the Research Centre for Unmanned Autonomous System, The Hong Kong Polytechnic University, Hong Kong, SAR, China","Department of Aeronautical and Aviation Engineering, Hong Kong Polytechnic University, Hong Kong, SAR, China"],"affiliations":[{"raw_affiliation_string":"Department of Aeronautical and Aviation Engineering and the Research Centre for Unmanned Autonomous System, The Hong Kong Polytechnic University, Hong Kong, SAR, China","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Department of Aeronautical and Aviation Engineering, Hong Kong Polytechnic University, Hong Kong, SAR, China","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045346492","display_name":"Weisong Wen","orcid":"https://orcid.org/0000-0003-4158-0913"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Weisong Wen","raw_affiliation_strings":["Department of Aeronautical and Aviation Engineering and the Research Centre for Unmanned Autonomous System, The Hong Kong Polytechnic University, Hong Kong, SAR, China","Department of Aeronautical and Aviation Engineering, Hong Kong Polytechnic University, Hong Kong, SAR, China"],"affiliations":[{"raw_affiliation_string":"Department of Aeronautical and Aviation Engineering and the Research Centre for Unmanned Autonomous System, The Hong Kong Polytechnic University, Hong Kong, SAR, China","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Department of Aeronautical and Aviation Engineering, Hong Kong Polytechnic University, Hong Kong, SAR, China","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100320703"],"corresponding_institution_ids":["https://openalex.org/I14243506"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.47038643,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"13","issue":"2","first_page":"3500","last_page":"3512"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10655","display_name":"GNSS positioning and interference","score":0.2939999997615814,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10655","display_name":"GNSS positioning and interference","score":0.2939999997615814,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11489","display_name":"Air Traffic Management and Optimization","score":0.15600000321865082,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.0617000013589859,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7361000180244446},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.612500011920929},{"id":"https://openalex.org/keywords/trustworthiness","display_name":"Trustworthiness","score":0.559499979019165},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.4690999984741211},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.428600013256073},{"id":"https://openalex.org/keywords/data-integrity","display_name":"Data integrity","score":0.3774999976158142},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.2840000092983246}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7361000180244446},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6970000267028809},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.612500011920929},{"id":"https://openalex.org/C153701036","wikidata":"https://www.wikidata.org/wiki/Q659974","display_name":"Trustworthiness","level":2,"score":0.559499979019165},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.4690999984741211},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.428600013256073},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.3961000144481659},{"id":"https://openalex.org/C33762810","wikidata":"https://www.wikidata.org/wiki/Q461671","display_name":"Data integrity","level":2,"score":0.3774999976158142},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34540000557899475},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.31360000371932983},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.2840000092983246},{"id":"https://openalex.org/C13687954","wikidata":"https://www.wikidata.org/wiki/Q4826847","display_name":"Autonomous agent","level":2,"score":0.2825999855995178},{"id":"https://openalex.org/C32896092","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Risk management","level":2,"score":0.28189998865127563},{"id":"https://openalex.org/C32230216","wikidata":"https://www.wikidata.org/wiki/Q7882499","display_name":"Uncertainty quantification","level":2,"score":0.27970001101493835},{"id":"https://openalex.org/C86369673","wikidata":"https://www.wikidata.org/wiki/Q1203659","display_name":"Simultaneous localization and mapping","level":4,"score":0.27730000019073486},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.27149999141693115},{"id":"https://openalex.org/C2776654903","wikidata":"https://www.wikidata.org/wiki/Q2601463","display_name":"SAFER","level":2,"score":0.26510000228881836},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.2581999897956848}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/jiot.2025.3633765","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2025.3633765","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},{"id":"pmh:oai:ira.lib.polyu.edu.hk:10397/117727","is_oa":false,"landing_page_url":"http://hdl.handle.net/10397/117727","pdf_url":null,"source":{"id":"https://openalex.org/S4306400205","display_name":"PolyU Institutional Research Archive (Hong Kong Polytechnic University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I14243506","host_organization_name":"Hong Kong Polytechnic University","host_organization_lineage":["https://openalex.org/I14243506"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal/Magazine Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W2082056119","https://openalex.org/W2162513948","https://openalex.org/W2999289476","https://openalex.org/W3122447121","https://openalex.org/W3176452384","https://openalex.org/W4220945937","https://openalex.org/W4226293621","https://openalex.org/W4375840665","https://openalex.org/W4375929150","https://openalex.org/W4383108357","https://openalex.org/W4383108450","https://openalex.org/W4386702654","https://openalex.org/W4386766811","https://openalex.org/W4386824909","https://openalex.org/W4387415195","https://openalex.org/W4392667254","https://openalex.org/W4394698794","https://openalex.org/W4395028520","https://openalex.org/W4395661371","https://openalex.org/W4398194910","https://openalex.org/W4401110597","https://openalex.org/W4401252052","https://openalex.org/W4401414310","https://openalex.org/W4401416449","https://openalex.org/W4403510960","https://openalex.org/W4403863433","https://openalex.org/W4405717468","https://openalex.org/W4406047022","https://openalex.org/W4408712150","https://openalex.org/W4409363140","https://openalex.org/W4409581235","https://openalex.org/W4411359041","https://openalex.org/W4412403975","https://openalex.org/W4412795708","https://openalex.org/W4415003074"],"related_works":[],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,69],"(RL)":[2],"has":[3],"shown":[4],"great":[5],"potential":[6],"for":[7,24],"autonomous":[8,75],"navigation":[9,54,76],"within":[10],"internet":[11],"of":[12,41],"things":[13],"(IoT)":[14],"environments,":[15],"where":[16],"various":[17],"and":[18,47,96,102,138,142,160],"changing":[19],"uncertainties":[20],"pose":[21],"significant":[22],"challenges":[23],"safe,":[25],"real-world":[26],"deployment.":[27],"Existing":[28],"safe":[29,165],"RL":[30,87,166],"methods":[31],"typically":[32],"employ":[33],"heuristic":[34],"constraints":[35],"while":[36,168],"neglecting":[37],"the":[38,81,106,132],"combined":[39],"impact":[40],"multiple":[42],"uncertainty":[43],"sources,":[44],"reducing":[45],"robustness":[46,161],"interpretability.":[48],"Drawing":[49],"on":[50],"concepts":[51],"from":[52],"global":[53],"satellite":[55],"system":[56],"(GNSS)":[57],"integrity":[58,65],"monitoring,":[59],"this":[60],"paper":[61],"proposes":[62],"an":[63,90,122],"epistemic":[64,103,112],"risk":[66,113],"monitoring":[67],"reinforcement":[68],"(EIRM-RL)":[70],"framework":[71,107],"to":[72,86,134,163],"enable":[73],"trustworthy":[74],"under":[77],"uncertainty.":[78,104],"EIRM-RL":[79,153],"extends":[80],"GNSS":[82],"protection":[83],"level":[84],"concept":[85],"by":[88],"utilizing":[89],"assembled":[91],"world":[92],"model":[93],"that":[94,152],"quantifies":[95],"incorporates":[97],"sensor":[98],"noise,":[99],"systematic":[100],"bias,":[101],"Furthermore,":[105],"continuously":[108],"monitors":[109],"a":[110],"dynamic":[111],"probability,":[114],"which":[115],"is":[116],"incorporated":[117],"into":[118],"policy":[119],"optimization":[120],"as":[121],"adaptive":[123],"safety":[124,141],"constraint":[125],"via":[126],"Lagrangian":[127],"duality.":[128],"This":[129],"method":[130],"enables":[131],"agent":[133],"proactively":[135],"avoid":[136],"hazards":[137],"effectively":[139],"balance":[140],"performance,":[143],"even":[144],"in":[145],"highly":[146],"uncertain":[147],"environments.":[148],"Extensive":[149],"experiments":[150],"demonstrate":[151],"achieves":[154],"superior":[155],"success":[156],"rates,":[157],"collision":[158],"avoidance,":[159],"compared":[162],"state-of-the-art":[164],"methods,":[167],"maintaining":[169],"high":[170],"efficiency.":[171]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-17T00:00:00"}
