{"id":"https://openalex.org/W4415399994","doi":"https://doi.org/10.1109/etfa65518.2025.11205530","title":"Safe reinforcement learning for ship energy management optimization with LLM-based reward shaping","display_name":"Safe reinforcement learning for ship energy management optimization with LLM-based reward shaping","publication_year":2025,"publication_date":"2025-09-09","ids":{"openalex":"https://openalex.org/W4415399994","doi":"https://doi.org/10.1109/etfa65518.2025.11205530"},"language":"en","primary_location":{"id":"doi:10.1109/etfa65518.2025.11205530","is_oa":false,"landing_page_url":"https://doi.org/10.1109/etfa65518.2025.11205530","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 30th International Conference on Emerging Technologies and Factory Automation (ETFA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://research.aalto.fi/en/publications/f3a8b0cf-6e9d-4e9e-8829-7325b2b6e2e3","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120084330","display_name":"Erald Shahinas","orcid":null},"institutions":[{"id":"https://openalex.org/I9927081","display_name":"Aalto University","ror":"https://ror.org/020hwjq30","country_code":"FI","type":"education","lineage":["https://openalex.org/I9927081"]}],"countries":["FI"],"is_corresponding":true,"raw_author_name":"Erald Shahinas","raw_affiliation_strings":["Aalto University,Department of Electrical Engineering and Automation,Espoo,Finland"],"affiliations":[{"raw_affiliation_string":"Aalto University,Department of Electrical Engineering and Automation,Espoo,Finland","institution_ids":["https://openalex.org/I9927081"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102049175","display_name":"Akira King","orcid":null},"institutions":[{"id":"https://openalex.org/I9927081","display_name":"Aalto University","ror":"https://ror.org/020hwjq30","country_code":"FI","type":"education","lineage":["https://openalex.org/I9927081"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Akira King","raw_affiliation_strings":["Aalto University,Department of Electrical Engineering and Automation,Espoo,Finland"],"affiliations":[{"raw_affiliation_string":"Aalto University,Department of Electrical Engineering and Automation,Espoo,Finland","institution_ids":["https://openalex.org/I9927081"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010935680","display_name":"Udayanto Dwi Atmojo","orcid":"https://orcid.org/0000-0002-6865-0806"},"institutions":[{"id":"https://openalex.org/I9927081","display_name":"Aalto University","ror":"https://ror.org/020hwjq30","country_code":"FI","type":"education","lineage":["https://openalex.org/I9927081"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Udayanto Dwi Atmojo","raw_affiliation_strings":["Aalto University,Department of Electrical Engineering and Automation,Espoo,Finland"],"affiliations":[{"raw_affiliation_string":"Aalto University,Department of Electrical Engineering and Automation,Espoo,Finland","institution_ids":["https://openalex.org/I9927081"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5120084330"],"corresponding_institution_ids":["https://openalex.org/I9927081"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.29215909,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12126","display_name":"Maritime Transport Emissions and Efficiency","score":0.9761999845504761,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12126","display_name":"Maritime Transport Emissions and Efficiency","score":0.9761999845504761,"subfield":{"id":"https://openalex.org/subfields/2305","display_name":"Environmental Engineering"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10808","display_name":"Electric and Hybrid Vehicle Technologies","score":0.9569000005722046,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8560000061988831},{"id":"https://openalex.org/keywords/cruise-control","display_name":"Cruise control","score":0.5160999894142151},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.4959999918937683},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.45019999146461487},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.4343000054359436},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.41940000653266907},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.41780000925064087},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.41019999980926514}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8560000061988831},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5353999733924866},{"id":"https://openalex.org/C113168747","wikidata":"https://www.wikidata.org/wiki/Q507295","display_name":"Cruise control","level":3,"score":0.5160999894142151},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.4959999918937683},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.4652000069618225},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.45019999146461487},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.4343000054359436},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.41940000653266907},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.41780000925064087},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.41019999980926514},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.40610000491142273},{"id":"https://openalex.org/C45882903","wikidata":"https://www.wikidata.org/wiki/Q5042317","display_name":"Fuel efficiency","level":2,"score":0.4059999883174896},{"id":"https://openalex.org/C7817414","wikidata":"https://www.wikidata.org/wiki/Q1779504","display_name":"Energy management","level":3,"score":0.4032000005245209},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.40310001373291016},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.390500009059906},{"id":"https://openalex.org/C2778821358","wikidata":"https://www.wikidata.org/wiki/Q2063640","display_name":"Cruise","level":2,"score":0.3449999988079071},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.3395000100135803},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.3359000086784363},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.32749998569488525},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.31049999594688416},{"id":"https://openalex.org/C198783460","wikidata":"https://www.wikidata.org/wiki/Q629173","display_name":"Management system","level":2,"score":0.3025999963283539},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.26899999380111694},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.26499998569488525},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.26019999384880066},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.25290000438690186}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/etfa65518.2025.11205530","is_oa":false,"landing_page_url":"https://doi.org/10.1109/etfa65518.2025.11205530","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE 30th International Conference on Emerging Technologies and Factory Automation (ETFA)","raw_type":"proceedings-article"},{"id":"pmh:oai:aaltodoc.aalto.fi:123456789/141575","is_oa":true,"landing_page_url":"https://research.aalto.fi/en/publications/f3a8b0cf-6e9d-4e9e-8829-7325b2b6e2e3","pdf_url":null,"source":{"id":"https://openalex.org/S4306401663","display_name":"Aaltodoc (Aalto University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I9927081","host_organization_name":"Aalto University","host_organization_lineage":["https://openalex.org/I9927081"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"acceptedVersion"},{"id":"pmh:oai:zenodo.org:18629738","is_oa":true,"landing_page_url":"https://doi.org/10.1109/ETFA65518.2025.11205530","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2025 IEEE 30th International Conference on Emerging Technologies and Factory Automation (ETFA), Porto-Portugal","raw_type":"info:eu-repo/semantics/other"}],"best_oa_location":{"id":"pmh:oai:aaltodoc.aalto.fi:123456789/141575","is_oa":true,"landing_page_url":"https://research.aalto.fi/en/publications/f3a8b0cf-6e9d-4e9e-8829-7325b2b6e2e3","pdf_url":null,"source":{"id":"https://openalex.org/S4306401663","display_name":"Aaltodoc (Aalto University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I9927081","host_organization_name":"Aalto University","host_organization_lineage":["https://openalex.org/I9927081"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"acceptedVersion"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Cruise":[0],"ships":[1],"are":[2],"large":[3,87,148],"greenhouse":[4],"gas":[5],"emitters.":[6],"Given":[7],"the":[8,16,70,105,108,193,196,200],"net-zero":[9],"emission":[10],"goal":[11],"by":[12,15],"2050":[13],"set":[14],"International":[17],"Maritime":[18],"Organization,":[19],"it":[20],"is":[21,34,58,111,204],"crucial":[22],"to":[23,35,42,69,84,86,123,141,152,182],"focus":[24,102],"on":[25,37,103],"different":[26],"strategies":[27],"for":[28,113,131],"reducing":[29,38,207],"emissions.":[30],"One":[31],"promising":[32,205],"strategy":[33],"work":[36,119],"energy":[39,50,56,93,133,171],"losses":[40],"due":[41],"non-optimal":[43],"management":[44,172],"of":[45,107,168,195],"a":[46,54,59,100,114,125,137,147,154,164,169,175],"cruise":[47],"ship\u2019s":[48,55,170],"complex":[49],"system.":[51],"Effectively":[52],"managing":[53],"consumption":[57],"difficult":[60],"task.":[61],"Modern":[62],"reinforcement":[63,96,127],"learning":[64,97,128],"approaches":[65,98],"have":[66,75],"been":[67],"employed":[68],"task":[71],"at":[72],"hand.":[73],"Results":[74],"shown":[76],"improvements":[77],"over":[78],"traditional":[79],"optimization":[80],"methods":[81],"that":[82,158,192],"fail":[83],"scale":[85],"stochastic":[88],"problems":[89],"such":[90],"as":[91,180],"ship":[92,132],"optimization.":[94,134],"However,":[95],"lack":[99],"direct":[101],"ensuring":[104],"safety":[106,139,160,197,208],"system,":[109],"which":[110],"critical":[112],"real-world":[115],"application.This":[116],"paper":[117],"showcases":[118],"in":[120,206],"progress":[121],"related":[122],"developing":[124],"safe":[126],"(RL)":[129],"framework":[130],"We":[135,162],"utilize":[136],"formal":[138],"shield":[140,198],"block":[142],"unsafe":[143],"control":[144],"actions":[145],"and":[146,174,184,199],"language":[149],"model":[150,179],"(LLM)":[151],"generate":[153],"reward":[155,202],"function":[156,203],"(RF)":[157],"incorporates":[159],"constraints.":[161],"construct":[163],"white-box":[165],"physical":[166],"system":[167,173],"faster":[176],"black-box":[177],"surrogate":[178],"environments":[181],"train":[183],"test":[185],"our":[186],"RL":[187],"methods.":[188],"Preliminary":[189],"results":[190],"show":[191],"integration":[194],"LLM-generated":[201],"violations.":[209]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-22T00:00:00"}
