{"id":"https://openalex.org/W4408236101","doi":"https://doi.org/10.1109/robio64047.2024.10907647","title":"OFSLMs: Offline Fine-Tuned Small Language Models Based on Hybrid Synthetic Knowledge for Robot Introspective Decision-Making","display_name":"OFSLMs: Offline Fine-Tuned Small Language Models Based on Hybrid Synthetic Knowledge for Robot Introspective Decision-Making","publication_year":2024,"publication_date":"2024-12-10","ids":{"openalex":"https://openalex.org/W4408236101","doi":"https://doi.org/10.1109/robio64047.2024.10907647"},"language":"en","primary_location":{"id":"doi:10.1109/robio64047.2024.10907647","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio64047.2024.10907647","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100306278","display_name":"Jinbiao Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jinbiao Zhu","raw_affiliation_strings":["Northeastern University,Faculty of Robot Science and Engineering,Shenyang,Liaoning Province,China"],"affiliations":[{"raw_affiliation_string":"Northeastern University,Faculty of Robot Science and Engineering,Shenyang,Liaoning Province,China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115593838","display_name":"Lishan Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lishan Wang","raw_affiliation_strings":["Northeastern University,Faculty of Robot Science and Engineering,Shenyang,Liaoning Province,China"],"affiliations":[{"raw_affiliation_string":"Northeastern University,Faculty of Robot Science and Engineering,Shenyang,Liaoning Province,China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116553336","display_name":"Yi Guc","orcid":null},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Guc","raw_affiliation_strings":["Northeastern University,Faculty of Robot Science and Engineering,Shenyang,Liaoning Province,China"],"affiliations":[{"raw_affiliation_string":"Northeastern University,Faculty of Robot Science and Engineering,Shenyang,Liaoning Province,China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100455750","display_name":"Fei Wang","orcid":"https://orcid.org/0000-0001-8432-0009"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei Wang","raw_affiliation_strings":["Northeastern University,Faculty of Robot Science and Engineering,Shenyang,Liaoning Province,China"],"affiliations":[{"raw_affiliation_string":"Northeastern University,Faculty of Robot Science and Engineering,Shenyang,Liaoning Province,China","institution_ids":["https://openalex.org/I9224756"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100306278"],"corresponding_institution_ids":["https://openalex.org/I9224756"],"apc_list":null,"apc_paid":null,"fwci":0.3626,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.71354859,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1839","last_page":"1844"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9624000191688538,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/introspection","display_name":"Introspection","score":0.8916681408882141},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7254993319511414},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6605714559555054},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5039169192314148},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.43048447370529175},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.10882151126861572},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.07263749837875366}],"concepts":[{"id":"https://openalex.org/C129671850","wikidata":"https://www.wikidata.org/wiki/Q210501","display_name":"Introspection","level":2,"score":0.8916681408882141},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7254993319511414},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6605714559555054},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5039169192314148},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.43048447370529175},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.10882151126861572},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.07263749837875366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/robio64047.2024.10907647","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio64047.2024.10907647","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6600000262260437,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G721033653","display_name":null,"funder_award_id":"62373086,62373087","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W4385570088","https://openalex.org/W4390099692","https://openalex.org/W4391128534","https://openalex.org/W4394828156","https://openalex.org/W4401553778"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4387404794","https://openalex.org/W2380479582","https://openalex.org/W4387405288","https://openalex.org/W4387404506","https://openalex.org/W2084234399","https://openalex.org/W4387405632","https://openalex.org/W2500774003"],"abstract_inverted_index":{"The":[0],"combination":[1],"of":[2,84,153,192],"robots":[3,72],"with":[4,53,76,107],"large":[5],"language":[6,165],"models":[7,63,166,173,214],"(LLMs)":[8],"offers":[9],"the":[10,59,65,144,151,154,160,170,189,193,198,224],"potential":[11],"to":[12,117,122,142,226],"create":[13,201],"more":[14],"intelligent":[15],"systems,":[16],"a":[17,94,102,138],"prospect":[18],"that":[19,71,197,206],"has":[20],"garnered":[21],"attention":[22],"from":[23],"researchers":[24],"in":[25,218,244],"recent":[26,161],"years.":[27],"Current":[28],"efforts":[29],"primarily":[30],"focus":[31],"on":[32,132,182],"constructing":[33],"prompt":[34],"systems":[35],"through":[36],"online":[37],"APIs":[38],"and":[39,44,57,64,100,109,119,125,156,167,187,205,231],"high-level":[40],"natural":[41],"language-based":[42],"planning":[43],"decision-making":[45,230],"offline.":[46,88],"However,":[47],"these":[48,98,183],"approaches":[49],"often":[50],"neglect":[51],"scenarios":[52],"weak":[54],"network":[55],"connectivity":[56],"downplay":[58],"close":[60],"integration":[61],"between":[62],"robot's":[66],"lower-level":[67,126],"control.":[68],"We":[69,177],"propose":[70],"should":[73],"be":[74],"equipped":[75],"Offline":[77],"Fine-tuned":[78],"Small":[79],"Language":[80],"Models":[81],"(OFSLMs)":[82],"capable":[83],"generating":[85],"introspective":[86],"decisions":[87],"To":[89],"this":[90],"end,":[91],"we":[92,136,149,158,200],"design":[93],"workflow":[95,209],"for":[96],"creating":[97],"OFSLMs":[99,121,222,239],"develop":[101],"hybrid":[103],"synthetic":[104],"fine-tuning":[105],"dataset":[106,113,199],"human":[108],"GPT-4's":[110],"annotation.":[111],"This":[112],"contains":[114],"2,663":[115],"cases":[116],"train":[118],"evaluate":[120],"generate":[123,232],"\u201cplan\u201d":[124],"control":[127,233],"codes":[128],"called":[129],"\u201csolution\u201d":[130],"based":[131],"given":[133],"\u201cinstruction.\u201d":[134],"Additionally,":[135],"devise":[137],"two-stage":[139],"evaluation":[140],"method":[141],"select":[143,159],"best":[145,171],"OFSLMs.":[146,194,212],"In":[147],"experiments,":[148],"analyze":[150],"distribution":[152],"dataset,":[155],"then":[157],"9":[162],"open-source":[163],"small":[164],"filter":[168],"out":[169],"3":[172],"using":[174],"proposed":[175,208],"workflow.":[176],"further":[178],"perform":[179,227],"nonlinear":[180],"fitting":[181],"OFSLMs'":[184],"numerical":[185],"metrics,":[186],"explore":[188],"generalization":[190,251],"capabilities":[191],"Experiments":[195],"demonstrate":[196,223],"is":[202],"semantically":[203],"rich":[204],"our":[207,221],"yields":[210],"high-quality":[211],"These":[213],"exhibit":[215],"non-linear":[216],"growth":[217],"metrics.":[219],"Moreover,":[220],"ability":[225],"offline":[228],"robot":[229],"code,":[234],"highlighting":[235],"their":[236,250],"specialization;":[237],"simultaneously,":[238],"also":[240],"show":[241],"comparable":[242],"performance":[243],"non-decision-related":[245],"text-based":[246],"question-answering":[247],"tasks,":[248],"indicating":[249],"capability.":[252]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
