{"id":"https://openalex.org/W7125894654","doi":"https://doi.org/10.1109/smc58881.2025.11342492","title":"Interpreting and Enhancing Decisions in Autonomous Navigation: A Belief-Desire-Intention Reinforcement Learning (BDI-RL) Approach","display_name":"Interpreting and Enhancing Decisions in Autonomous Navigation: A Belief-Desire-Intention Reinforcement Learning (BDI-RL) Approach","publication_year":2025,"publication_date":"2025-10-05","ids":{"openalex":"https://openalex.org/W7125894654","doi":"https://doi.org/10.1109/smc58881.2025.11342492"},"language":null,"primary_location":{"id":"doi:10.1109/smc58881.2025.11342492","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11342492","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065156490","display_name":"Adolfo Perrusqu\u00eda","orcid":"https://orcid.org/0000-0003-2290-1160"},"institutions":[{"id":"https://openalex.org/I82284825","display_name":"Cranfield University","ror":"https://ror.org/05cncd958","country_code":"GB","type":"education","lineage":["https://openalex.org/I82284825"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Adolfo Perrusqu\u00eda","raw_affiliation_strings":["Cranfield University,School of Aerospace, Transport and Manufacturing,Bedford,UK"],"affiliations":[{"raw_affiliation_string":"Cranfield University,School of Aerospace, Transport and Manufacturing,Bedford,UK","institution_ids":["https://openalex.org/I82284825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014006642","display_name":"Deepak Kumar Panda","orcid":"https://orcid.org/0000-0001-8835-3908"},"institutions":[{"id":"https://openalex.org/I82284825","display_name":"Cranfield University","ror":"https://ror.org/05cncd958","country_code":"GB","type":"education","lineage":["https://openalex.org/I82284825"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Deepak Panda","raw_affiliation_strings":["Cranfield University,School of Aerospace, Transport and Manufacturing,Bedford,UK"],"affiliations":[{"raw_affiliation_string":"Cranfield University,School of Aerospace, Transport and Manufacturing,Bedford,UK","institution_ids":["https://openalex.org/I82284825"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085188653","display_name":"Weisi Guo","orcid":null},"institutions":[{"id":"https://openalex.org/I82284825","display_name":"Cranfield University","ror":"https://ror.org/05cncd958","country_code":"GB","type":"education","lineage":["https://openalex.org/I82284825"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Weisi Guo","raw_affiliation_strings":["Cranfield University,School of Aerospace, Transport and Manufacturing,Bedford,UK"],"affiliations":[{"raw_affiliation_string":"Cranfield University,School of Aerospace, Transport and Manufacturing,Bedford,UK","institution_ids":["https://openalex.org/I82284825"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5065156490"],"corresponding_institution_ids":["https://openalex.org/I82284825"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.83824715,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"5643","last_page":"5648"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.8637999892234802,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.8637999892234802,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.016899999231100082,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10525","display_name":"Human-Automation Interaction and Safety","score":0.013000000268220901,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7541000247001648},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.63919997215271},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.59170001745224},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.4880000054836273},{"id":"https://openalex.org/keywords/trustworthiness","display_name":"Trustworthiness","score":0.439300000667572},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.4027999937534332}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7541000247001648},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7211999893188477},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.63919997215271},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.59170001745224},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5717999935150146},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.4880000054836273},{"id":"https://openalex.org/C153701036","wikidata":"https://www.wikidata.org/wiki/Q659974","display_name":"Trustworthiness","level":2,"score":0.439300000667572},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.4027999937534332},{"id":"https://openalex.org/C65414064","wikidata":"https://www.wikidata.org/wiki/Q484105","display_name":"Autonomy","level":2,"score":0.40059998631477356},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37279999256134033},{"id":"https://openalex.org/C13687954","wikidata":"https://www.wikidata.org/wiki/Q4826847","display_name":"Autonomous agent","level":2,"score":0.3594000041484833},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3418000042438507},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3400000035762787},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2752000093460083},{"id":"https://openalex.org/C34972735","wikidata":"https://www.wikidata.org/wiki/Q2920267","display_name":"Engineering design process","level":2,"score":0.25679999589920044},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.2524999976158142}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/smc58881.2025.11342492","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11342492","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.4922851622104645,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320005","display_name":"Royal Academy of Engineering","ror":"https://ror.org/0526snb40"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W129687690","https://openalex.org/W1544123977","https://openalex.org/W1875470631","https://openalex.org/W1996813382","https://openalex.org/W2056509413","https://openalex.org/W2240067561","https://openalex.org/W2282821441","https://openalex.org/W2962702317","https://openalex.org/W2962858109","https://openalex.org/W3036046236","https://openalex.org/W3130800560","https://openalex.org/W3157716083","https://openalex.org/W3182053794","https://openalex.org/W3206820790","https://openalex.org/W4206966378","https://openalex.org/W4226218930","https://openalex.org/W4386505803","https://openalex.org/W4388919215","https://openalex.org/W4392128889","https://openalex.org/W4394963598","https://openalex.org/W4399801349","https://openalex.org/W4401329608","https://openalex.org/W4403534639","https://openalex.org/W4404317177","https://openalex.org/W4404994176","https://openalex.org/W4407415444","https://openalex.org/W4410990663","https://openalex.org/W7124276366"],"related_works":[],"abstract_inverted_index":{"Explaining":[0],"autonomy":[1],"is":[2,25],"becoming":[3],"a":[4,76,88,131,154],"crucial":[5],"factor":[6],"in":[7,14,63,153],"the":[8,46,51,64,68,84,93,97,109,137,168,171],"design":[9,52],"of":[10,43,53,67,96,111,127,140,157,170],"trustworthy":[11],"autonomous":[12,36],"platforms":[13],"both":[15],"transport":[16],"and":[17,118,145,160],"smart":[18],"living":[19],"sectors.":[20],"Interpretable":[21],"reinforcement":[22],"learning":[23,94],"(RL)":[24],"an":[26,35,39],"emerging":[27],"research":[28],"area":[29],"that":[30,59,82,91,134],"aims":[31],"to":[32,166],"explain":[33],"why":[34],"platform":[37],"adopts":[38],"action":[40],"or":[41],"set":[42],"actions.":[44],"However,":[45],"state-of-the-art":[47],"has":[48],"focused":[49],"on":[50],"explainable":[54,85,122],"tools":[55],"as":[56,87,99,101,114,121],"independent":[57],"modules":[58],"are":[60,151,163],"not":[61],"involved":[62],"decision-making":[65],"process":[66,139],"RL":[69,79,98,116],"agent.":[70],"In":[71],"this":[72,105],"paper,":[73],"we":[74,107],"propose":[75],"novel":[77],"belief-desire-intention":[78],"(BDI-RL)":[80],"approach":[81],"incorporates":[83],"module":[86],"belief":[89,119],"model":[90,117,133],"enhances":[92],"capabilities":[95],"well":[100],"actions":[102],"interpretability.":[103],"To":[104],"end,":[106],"combine":[108],"merits":[110],"Dyna-Q":[112],"algorithm":[113],"backbone":[115],"maps":[120],"element.":[123],"The":[124],"combined":[125],"contribution":[126],"these":[128],"models":[129],"provides":[130],"robust":[132],"emulates":[135],"better":[136],"reasoning":[138],"humans":[141],"by":[142],"leveraging":[143],"beliefs":[144],"online":[146],"agent-environment":[147],"interactions.":[148],"Simulations":[149],"experiments":[150],"conducted":[152],"grid":[155],"environment":[156],"different":[158],"sizes":[159],"obstacles.":[161],"Comparisons":[162],"also":[164],"provided":[165],"show":[167],"benefits":[169],"proposed":[172],"methodology.":[173]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-01-29T00:00:00"}
