{"id":"https://openalex.org/W4366381342","doi":"https://doi.org/10.1145/3584376.3584459","title":"TOCIM: An improved operant conditioning model with task-oriented curiosity","display_name":"TOCIM: An improved operant conditioning model with task-oriented curiosity","publication_year":2022,"publication_date":"2022-12-16","ids":{"openalex":"https://openalex.org/W4366381342","doi":"https://doi.org/10.1145/3584376.3584459"},"language":"en","primary_location":{"id":"doi:10.1145/3584376.3584459","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3584376.3584459","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 4th International Conference on Robotics, Intelligent Control and Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039494134","display_name":"Yufan Li","orcid":null},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yufan Li","raw_affiliation_strings":["Faculty of Information Technology, Beijing University of Technology, China"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, Beijing University of Technology, China","institution_ids":["https://openalex.org/I37796252"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017130874","display_name":"Jing Huang","orcid":"https://orcid.org/0000-0001-8804-7150"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Huang","raw_affiliation_strings":["Faculty of Information Technology, Beijing University of Technology, China"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, Beijing University of Technology, China","institution_ids":["https://openalex.org/I37796252"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005182041","display_name":"Chenliang Lin","orcid":"https://orcid.org/0009-0006-2160-5916"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenliang Lin","raw_affiliation_strings":["Faculty of Information Technology, Beijing University of Technology, China"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, Beijing University of Technology, China","institution_ids":["https://openalex.org/I37796252"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021105218","display_name":"Yazhou Lu","orcid":"https://orcid.org/0009-0004-3907-0396"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yazhou Lu","raw_affiliation_strings":["Faculty of Information Technology, Beijing University of Technology, China"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, Beijing University of Technology, China","institution_ids":["https://openalex.org/I37796252"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5039494134"],"corresponding_institution_ids":["https://openalex.org/I37796252"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21717362,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"457","last_page":"463"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14308","display_name":"Psychological and Educational Research Studies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T14308","display_name":"Psychological and Educational Research Studies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10656","display_name":"Child and Animal Learning Development","score":0.9323999881744385,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/curiosity","display_name":"Curiosity","score":0.8764397501945496},{"id":"https://openalex.org/keywords/novelty","display_name":"Novelty","score":0.713611364364624},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6230680346488953},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.605476975440979},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5342015027999878},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.527823269367218},{"id":"https://openalex.org/keywords/action-selection","display_name":"Action selection","score":0.521674633026123},{"id":"https://openalex.org/keywords/orientation","display_name":"Orientation (vector space)","score":0.5108072757720947},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.5104395747184753},{"id":"https://openalex.org/keywords/associative-learning","display_name":"Associative learning","score":0.48327523469924927},{"id":"https://openalex.org/keywords/conditioning","display_name":"Conditioning","score":0.4728425145149231},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46157845854759216},{"id":"https://openalex.org/keywords/operant-conditioning","display_name":"Operant conditioning","score":0.45961636304855347},{"id":"https://openalex.org/keywords/preference","display_name":"Preference","score":0.44899433851242065},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.43908652663230896},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.24479153752326965},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.24196240305900574},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2134886384010315},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.17569366097450256},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.13660961389541626},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.10227170586585999},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.10176783800125122},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08599880337715149}],"concepts":[{"id":"https://openalex.org/C33435437","wikidata":"https://www.wikidata.org/wiki/Q366791","display_name":"Curiosity","level":2,"score":0.8764397501945496},{"id":"https://openalex.org/C2778738651","wikidata":"https://www.wikidata.org/wiki/Q16546687","display_name":"Novelty","level":2,"score":0.713611364364624},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6230680346488953},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.605476975440979},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5342015027999878},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.527823269367218},{"id":"https://openalex.org/C166109690","wikidata":"https://www.wikidata.org/wiki/Q4677422","display_name":"Action selection","level":3,"score":0.521674633026123},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.5108072757720947},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.5104395747184753},{"id":"https://openalex.org/C2983526489","wikidata":"https://www.wikidata.org/wiki/Q133500","display_name":"Associative learning","level":2,"score":0.48327523469924927},{"id":"https://openalex.org/C45262634","wikidata":"https://www.wikidata.org/wiki/Q5159291","display_name":"Conditioning","level":2,"score":0.4728425145149231},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46157845854759216},{"id":"https://openalex.org/C163270606","wikidata":"https://www.wikidata.org/wiki/Q847079","display_name":"Operant conditioning","level":3,"score":0.45961636304855347},{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.44899433851242065},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.43908652663230896},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.24479153752326965},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.24196240305900574},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2134886384010315},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.17569366097450256},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.13660961389541626},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10227170586585999},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.10176783800125122},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08599880337715149},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3584376.3584459","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3584376.3584459","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 4th International Conference on Robotics, Intelligent Control and Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":3,"referenced_works":["https://openalex.org/W2170899200","https://openalex.org/W2269602391","https://openalex.org/W2484231675"],"related_works":["https://openalex.org/W4231562957","https://openalex.org/W96406935","https://openalex.org/W2483625864","https://openalex.org/W2239959725","https://openalex.org/W1999185412","https://openalex.org/W1415628142","https://openalex.org/W2055292374","https://openalex.org/W2120149263","https://openalex.org/W2055848231","https://openalex.org/W2169381998"],"abstract_inverted_index":{"As":[0,49],"an":[1],"important":[2],"type":[3],"of":[4,91,134,168,190],"associative":[5],"learning,":[6],"operation":[7],"conditioning":[8,28],"and":[9,118,145,154,170],"its":[10],"mathematical":[11],"models":[12,39,174],"have":[13,40,160,175],"been":[14,161,176],"studied":[15],"a":[16,41,50,75,88],"lot.":[17],"The":[18,83,178],"recent":[19],"trend":[20],"is":[21,85,127],"to":[22,29,54,61,69,150,164],"introduce":[23],"intrinsic":[24,37,79,125],"motivation":[25,38,80,126],"in":[26,148,156,187],"operant":[27],"expand":[30],"the":[31,56,66,71,124,132,135,140,143,146,166],"search":[32],"space.":[33],"However,":[34],"traditional":[35],"curiosity-based":[36],"strong":[42],"preference":[43],"for":[44],"those":[45],"states":[46,57,144],"seldomly":[47],"visited.":[48],"result,":[51],"they":[52],"intend":[53],"ignore":[55],"most":[58],"possibly":[59],"leading":[60],"target,":[62],"which":[63],"may":[64],"decrease":[65],"efficiency.":[67],"Aiming":[68],"solve":[70],"problem,":[72],"we":[73],"propose":[74],"task-oriented":[76],"curiosity":[77,111],"based":[78],"model":[81,84,184],"(TOCIM).":[82],"described":[86],"as":[87],"tuple":[89],"consisting":[90],"8":[92],"elements,":[93],"including":[94],"state":[95],"space":[96,99],"S,":[97],"action":[98,119],"A,":[100],"orientation":[101,104,114],"matrix":[102,109,112],"O,":[103],"function":[105],"V,":[106],"access":[107],"number":[108],"N,":[110],"C,":[113],"update":[115],"mechanism":[116],"e,":[117],"selection":[120],"strategy":[121],"G.":[122],"Here,":[123],"measured":[128],"not":[129],"only":[130],"by":[131,139],"novelty":[133],"sates,":[136],"but":[137],"also":[138],"correlation":[141],"between":[142],"target":[147],"order":[149],"trade":[151],"off":[152],"exploration":[153],"exploitation":[155],"navigation.":[157,191],"Simulation":[158],"experiments":[159],"carried":[162],"out":[163],"testify":[165],"validation":[167],"TOCIM,":[169],"some":[171],"other":[172],"similar":[173],"compared.":[177],"experiment":[179],"results":[180],"show":[181],"that":[182],"our":[183],"has":[185],"advantage":[186],"training":[188],"time":[189]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
