{"id":"https://openalex.org/W4409233663","doi":"https://doi.org/10.1109/lra.2025.3558648","title":"Enhancing Robot Learning Through Cognitive Reasoning Trajectory Optimization Under Unknown Dynamics","display_name":"Enhancing Robot Learning Through Cognitive Reasoning Trajectory Optimization Under Unknown Dynamics","publication_year":2025,"publication_date":"2025-04-07","ids":{"openalex":"https://openalex.org/W4409233663","doi":"https://doi.org/10.1109/lra.2025.3558648"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2025.3558648","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2025.3558648","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018809359","display_name":"Qingwei Dong","orcid":"https://orcid.org/0000-0002-6783-8647"},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qingwei Dong","raw_affiliation_strings":["State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","State Key Laboratory of Robotics, Shenyang Institute of AutomationChinese Academy of Sciences"],"raw_orcid":"https://orcid.org/0000-0002-6783-8647","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of AutomationChinese Academy of Sciences","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Tingting Wu","orcid":"https://orcid.org/0009-0003-6982-6994"},"institutions":[{"id":"https://openalex.org/I180662265","display_name":"China Mobile (China)","ror":"https://ror.org/05gftfe97","country_code":"CN","type":"company","lineage":["https://openalex.org/I180662265"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tingting Wu","raw_affiliation_strings":["China Mobile Research Institute, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0003-6982-6994","affiliations":[{"raw_affiliation_string":"China Mobile Research Institute, Beijing, China","institution_ids":["https://openalex.org/I180662265"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067626781","display_name":"Peng Zeng","orcid":"https://orcid.org/0000-0001-7863-3260"},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Zeng","raw_affiliation_strings":["State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","State Key Laboratory of Robotics, Shenyang Institute of AutomationChinese Academy of Sciences"],"raw_orcid":"https://orcid.org/0000-0001-7863-3260","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of AutomationChinese Academy of Sciences","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089121136","display_name":"Chuanzhi Zang","orcid":null},"institutions":[{"id":"https://openalex.org/I157507598","display_name":"Shenyang University of Technology","ror":"https://ror.org/00d7f8730","country_code":"CN","type":"education","lineage":["https://openalex.org/I157507598"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chuanzhi zang","raw_affiliation_strings":["School of Artifcial Intelligence, Shenyang University of Technology, Shenyang, China","School of Artifcial Intelligence, Shenyang University of Technology, Liaoning, Shenyang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Artifcial Intelligence, Shenyang University of Technology, Shenyang, China","institution_ids":["https://openalex.org/I157507598"]},{"raw_affiliation_string":"School of Artifcial Intelligence, Shenyang University of Technology, Liaoning, Shenyang, China","institution_ids":["https://openalex.org/I157507598"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079519256","display_name":"Guangxi Wan","orcid":"https://orcid.org/0000-0003-4456-6236"},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guangxi Wan","raw_affiliation_strings":["State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","State Key Laboratory of Robotics, Shenyang Institute of AutomationChinese Academy of Sciences"],"raw_orcid":"https://orcid.org/0000-0003-4456-6236","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of AutomationChinese Academy of Sciences","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":null,"display_name":"Shijie Cui","orcid":"https://orcid.org/0000-0002-3771-706X"},"institutions":[{"id":"https://openalex.org/I142078773","display_name":"Shenyang Institute of Automation","ror":"https://ror.org/00ft6nj33","country_code":"CN","type":"facility","lineage":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shijie Cui","raw_affiliation_strings":["State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","State Key Laboratory of Robotics, Shenyang Institute of AutomationChinese Academy of Sciences"],"raw_orcid":"https://orcid.org/0000-0002-3771-706X","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of Automation, Chinese Academy of Sciences, Shenyang, China","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]},{"raw_affiliation_string":"State Key Laboratory of Robotics, Shenyang Institute of AutomationChinese Academy of Sciences","institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5018809359"],"corresponding_institution_ids":["https://openalex.org/I142078773","https://openalex.org/I19820366"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0289471,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"10","issue":"6","first_page":"5401","last_page":"5408"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9179999828338623,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9179999828338623,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9144999980926514,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.6469449996948242},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.6027095913887024},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5585805177688599},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5372445583343506},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5370345115661621},{"id":"https://openalex.org/keywords/dynamics","display_name":"Dynamics (music)","score":0.5289102792739868},{"id":"https://openalex.org/keywords/cognitive-robotics","display_name":"Cognitive robotics","score":0.41910016536712646},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.405966579914093},{"id":"https://openalex.org/keywords/cognitive-science","display_name":"Cognitive science","score":0.3631681501865387},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.2799113392829895},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.07024362683296204},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.060652464628219604}],"concepts":[{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.6469449996948242},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.6027095913887024},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5585805177688599},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5372445583343506},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5370345115661621},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.5289102792739868},{"id":"https://openalex.org/C192327766","wikidata":"https://www.wikidata.org/wiki/Q1038799","display_name":"Cognitive robotics","level":3,"score":0.41910016536712646},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.405966579914093},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.3631681501865387},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2799113392829895},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.07024362683296204},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.060652464628219604},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2025.3558648","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2025.3558648","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1068830511","display_name":null,"funder_award_id":"2024-MSBA-83","funder_id":"https://openalex.org/F4320323086","funder_display_name":"Natural Science Foundation of Liaoning Province"},{"id":"https://openalex.org/G1706880264","display_name":null,"funder_award_id":"92067205","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3067006959","display_name":null,"funder_award_id":"92267301","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G74403156","display_name":null,"funder_award_id":"92267205","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7588867604","display_name":null,"funder_award_id":"92367301","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323086","display_name":"Natural Science Foundation of Liaoning Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1587009522","https://openalex.org/W1738827650","https://openalex.org/W2060914855","https://openalex.org/W2126909264","https://openalex.org/W2129202194","https://openalex.org/W2221677593","https://openalex.org/W2580909119","https://openalex.org/W2962872206","https://openalex.org/W2963930274","https://openalex.org/W2968116426","https://openalex.org/W2997896361","https://openalex.org/W4205513846","https://openalex.org/W4224912544","https://openalex.org/W4383097638","https://openalex.org/W4385245566","https://openalex.org/W4387092545","https://openalex.org/W4388720459","https://openalex.org/W4388740223","https://openalex.org/W4389665935","https://openalex.org/W4393160302","https://openalex.org/W4393160795","https://openalex.org/W4393763811","https://openalex.org/W4396877948","https://openalex.org/W4399374221","https://openalex.org/W4406800520","https://openalex.org/W6682849425","https://openalex.org/W6736057607","https://openalex.org/W6740023956","https://openalex.org/W6741361698","https://openalex.org/W6769596995","https://openalex.org/W6796440922","https://openalex.org/W6809509765","https://openalex.org/W6809646742","https://openalex.org/W6839928859","https://openalex.org/W6851513886","https://openalex.org/W6853465110","https://openalex.org/W6854929498","https://openalex.org/W6862218055","https://openalex.org/W6867621267"],"related_works":["https://openalex.org/W2903025760","https://openalex.org/W4289147272","https://openalex.org/W1906023716","https://openalex.org/W2891970620","https://openalex.org/W1969477307","https://openalex.org/W2513760693","https://openalex.org/W1211648536","https://openalex.org/W1990035816","https://openalex.org/W2484031233","https://openalex.org/W4246694033"],"abstract_inverted_index":{"In":[0,155],"the":[1,9,36,47,51,57,89,126,134,149,207,213,225,229,233,236],"domain":[2],"of":[3,39,50,77,92,102,130,138,151,215,235],"robot":[4,52,227],"learning,":[5],"equipping":[6],"robots":[7],"with":[8,74,133,144,176,195],"capability":[10],"to":[11,46,83,173,180],"swiftly":[12],"acquire":[13],"operational":[14],"skills":[15],"poses":[16],"a":[17,75,93,160],"significant":[18],"challenge.":[19],"Currently,":[20],"reinforcement":[21,131],"learning":[22,132],"techniques":[23],"are":[24],"adept":[25],"at":[26],"addressing":[27],"dynamic,":[28],"unstructured":[29],"problems":[30],"involving":[31,116],"rich":[32,117],"contact":[33,118],"scenarios.":[34],"However,":[35],"convergence":[37],"rate":[38],"these":[40,72],"algorithms":[41],"is":[42],"often":[43],"slow":[44],"due":[45],"high":[48],"dimensionality":[49],"state-action":[53],"mapping":[54],"space":[55,210],"and":[56,104,140,200,211],"extensive":[58],"initial":[59,90],"policy":[60,142,152,208],"search":[61,143,209],"space.":[62],"Meanwhile,":[63],"advancements":[64],"in":[65,108,112,185,228],"large":[66],"language":[67],"models":[68,73,97,194],"(LLMs)":[69],"have":[70],"endowed":[71],"degree":[76],"logical":[78,136,178],"reasoning":[79,137,179,198],"ability,":[80],"enabling":[81],"them":[82],"take":[84],"goal-oriented":[85],"actions":[86],"proactively":[87],"during":[88],"phase":[91],"robotic":[94],"task.":[95],"These":[96],"can":[98],"implicitly":[99],"generate":[100],"features":[101],"states":[103],"uncover":[105],"underlying":[106],"patterns":[107],"trajectory":[109,216],"generation.":[110],"Yet,":[111],"complex":[113],"manipulative":[114,222],"tasks":[115,223],"scenarios,":[119],"LLMs":[120,175],"still":[121],"fall":[122],"short.":[123],"Thus,":[124],"integrating":[125],"robust":[127,177],"interactive":[128],"capabilities":[129],"strong":[135],"LLMs,":[139,145],"enhancing":[141],"could":[146],"potentially":[147],"accelerate":[148],"speed":[150],"searches":[153],"significantly.":[154],"this":[156,204],"paper,":[157],"we":[158],"introduce":[159],"Cognitive":[161,170],"Reasoning":[162],"Trajectory":[163],"Optimization":[164],"method.":[165],"This":[166],"approach":[167],"utilizes":[168],"Low-level":[169],"Control":[171],"Tuning":[172],"enable":[174],"make":[181],"effective":[182],"single-step":[183],"decisions":[184],"Markov":[186],"Decision":[187],"Process":[188],"(MDP)":[189],"tasks.":[190],"By":[191],"fitting":[192],"dynamic":[193],"high-quality":[196],"cognitive":[197],"data":[199],"optimizing":[201],"control":[202],"strategies,":[203],"method":[205],"constrains":[206],"enhances":[212],"efficiency":[214],"optimization.":[217],"Experimental":[218],"results":[219],"on":[220],"various":[221],"using":[224],"Sawyer":[226],"Mujoco":[230],"simulator":[231],"validate":[232],"effectiveness":[234],"proposed":[237],"algorithm.":[238]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
