{"id":"https://openalex.org/W4401415635","doi":"https://doi.org/10.1109/cec60901.2024.10612166","title":"ROIL: Rule Optimization via Large Language Model for Imitation Learning","display_name":"ROIL: Rule Optimization via Large Language Model for Imitation Learning","publication_year":2024,"publication_date":"2024-06-30","ids":{"openalex":"https://openalex.org/W4401415635","doi":"https://doi.org/10.1109/cec60901.2024.10612166"},"language":"en","primary_location":{"id":"doi:10.1109/cec60901.2024.10612166","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/cec60901.2024.10612166","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Congress on Evolutionary Computation (CEC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028392541","display_name":"Yossathorn Tianrungroj","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yossathorn Tianrungroj","raw_affiliation_strings":["Graduate School of Information Science and Technology, The University of Tokyo,Tokyo,Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Technology, The University of Tokyo,Tokyo,Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005925953","display_name":"Hitoshi Iba","orcid":"https://orcid.org/0000-0001-7815-0306"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hitoshi Iba","raw_affiliation_strings":["Graduate School of Information Science and Technology, The University of Tokyo,Tokyo,Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Technology, The University of Tokyo,Tokyo,Japan","institution_ids":["https://openalex.org/I74801974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5028392541"],"corresponding_institution_ids":["https://openalex.org/I74801974"],"apc_list":null,"apc_paid":null,"fwci":0.3637,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.65446313,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9801999926567078,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7626815438270569},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.6310502290725708},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5146933197975159},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.40389952063560486},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.08166763186454773}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7626815438270569},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.6310502290725708},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5146933197975159},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.40389952063560486},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.08166763186454773},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cec60901.2024.10612166","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/cec60901.2024.10612166","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Congress on Evolutionary Computation (CEC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.49000000953674316,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W1945616565","https://openalex.org/W1999128321","https://openalex.org/W2043003550","https://openalex.org/W2889787757","https://openalex.org/W2963961878","https://openalex.org/W3027879771","https://openalex.org/W3177813494","https://openalex.org/W4212774754","https://openalex.org/W4221143046","https://openalex.org/W4281557260","https://openalex.org/W4283828996","https://openalex.org/W4308244910","https://openalex.org/W4360836968","https://openalex.org/W4366735548","https://openalex.org/W4384616038","https://openalex.org/W4385245566","https://openalex.org/W4385574139","https://openalex.org/W4386081135","https://openalex.org/W4386554921","https://openalex.org/W4386566526","https://openalex.org/W4387635374","https://openalex.org/W4387838288","https://openalex.org/W4388139328","https://openalex.org/W4389520756","https://openalex.org/W6640425456","https://openalex.org/W6777615688","https://openalex.org/W6778883912","https://openalex.org/W6784429693","https://openalex.org/W6798182279","https://openalex.org/W6803991540","https://openalex.org/W6809646742","https://openalex.org/W6838865847","https://openalex.org/W6839827046","https://openalex.org/W6846254642","https://openalex.org/W6846556436","https://openalex.org/W6850886341","https://openalex.org/W6850936240","https://openalex.org/W6854010665","https://openalex.org/W6855425347","https://openalex.org/W6855844941","https://openalex.org/W6857154067","https://openalex.org/W6857359116"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W2748952813","https://openalex.org/W1531601525","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Recent":[0],"improvements":[1],"in":[2,12,26,57,69,85,126,135,186],"pretrained":[3],"Large":[4],"Language":[5],"Models":[6],"(LLMs)":[7],"have":[8],"demonstrated":[9],"increasing":[10],"capabilities":[11,54],"various":[13],"natural":[14,58,70],"language":[15,59],"processing":[16],"tasks,":[17],"such":[18],"as":[19],"instruction":[20],"following.":[21],"However,":[22],"effectively":[23],"utilizing":[24],"LLMs":[25,80,95],"interactive":[27,87],"environments":[28],"that":[29],"require":[30],"advanced":[31],"reasoning,":[32],"planning,":[33],"and":[34,111,115,151],"decision-making":[35],"skills":[36,125],"remains":[37],"a":[38,74,139,148,155,163],"challenge.":[39],"In":[40],"this":[41,169,187],"study,":[42],"we":[43,72],"integrate":[44],"Learning":[45,83],"Classifier":[46],"Systems":[47],"(LCS)":[48],"with":[49],"LLMs,":[50],"thereby":[51],"extending":[52],"their":[53],"to":[55,96,162],"interact":[56],"domains.":[60],"To":[61],"accommodate":[62],"the":[63,66,105,120,131,136,172],"integration,":[64],"especially":[65],"rule":[67,91],"represented":[68],"language,":[71],"propose":[73],"novel":[75],"Rule":[76],"Optimization":[77],"method":[78,146],"using":[79,176],"for":[81,107,183],"Imitation":[82],"(ROIL)":[84],"text-based":[86,140],"environments.":[88,128],"ROIL":[89,134,175],"addresses":[90],"learning":[92,109,123,166],"by":[93],"lever-aging":[94],"optimize":[97],"rules":[98],"based":[99],"on":[100],"human":[101],"demonstrations,":[102],"thus":[103],"eliminating":[104],"need":[106],"trial-and-error":[108],"processes":[110],"ensuring":[112],"both":[113],"interpretability":[114],"safety.":[116],"It":[117],"also":[118],"tackles":[119],"challenge":[121],"of":[122,133,174],"transferable":[124],"these":[127],"We":[129],"evaluate":[130],"efficacy":[132],"WebShop":[137],"environment,":[138],"e-commerce":[141],"website":[142],"navigation":[143],"problem.":[144],"The":[145],"achieved":[147],"significant":[149],"performance":[150,160],"efficiency":[152],"improvement":[153],"over":[154],"strong":[156],"baseline,":[157],"while":[158],"demonstrating":[159],"close":[161],"gradient-based":[164],"imitation":[165],"approach.":[167],"Additionally,":[168],"study":[170],"explores":[171],"enhancement":[173],"meta-heuristic":[177],"optimization":[178],"algorithms,":[179],"providing":[180],"foundational":[181],"research":[182],"further":[184],"investigation":[185],"area.":[188]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2025-10-10T00:00:00"}
