{"id":"https://openalex.org/W4317609215","doi":"https://doi.org/10.3390/a16020068","title":"Inverse Reinforcement Learning as the Algorithmic Basis for Theory of Mind: Current Methods and Open Problems","display_name":"Inverse Reinforcement Learning as the Algorithmic Basis for Theory of Mind: Current Methods and Open Problems","publication_year":2023,"publication_date":"2023-01-19","ids":{"openalex":"https://openalex.org/W4317609215","doi":"https://doi.org/10.3390/a16020068"},"language":"en","primary_location":{"id":"doi:10.3390/a16020068","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a16020068","pdf_url":"https://www.mdpi.com/1999-4893/16/2/68/pdf?version=1675246431","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/1999-4893/16/2/68/pdf?version=1675246431","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054135227","display_name":"Jaime Ruiz-Serra","orcid":"https://orcid.org/0000-0002-0220-3253"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Jaime Ruiz-Serra","raw_affiliation_strings":["Modelling and Simulation Research Group, School of Computer Science, Faculty of Engineering, The University of Sydney, Sydney, NSW 2006, Australia"],"affiliations":[{"raw_affiliation_string":"Modelling and Simulation Research Group, School of Computer Science, Faculty of Engineering, The University of Sydney, Sydney, NSW 2006, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001069613","display_name":"Michael Harr\u00e9","orcid":"https://orcid.org/0000-0003-2199-2515"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Michael S. Harr\u00e9","raw_affiliation_strings":["Modelling and Simulation Research Group, School of Computer Science, Faculty of Engineering, The University of Sydney, Sydney, NSW 2006, Australia"],"affiliations":[{"raw_affiliation_string":"Modelling and Simulation Research Group, School of Computer Science, Faculty of Engineering, The University of Sydney, Sydney, NSW 2006, Australia","institution_ids":["https://openalex.org/I129604602"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5001069613"],"corresponding_institution_ids":["https://openalex.org/I129604602"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":5.2056,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.94957323,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"16","issue":"2","first_page":"68","last_page":"68"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11252","display_name":"Evolutionary Game Theory and Cooperation","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11252","display_name":"Evolutionary Game Theory and Cooperation","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10656","display_name":"Child and Animal Learning Development","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12520","display_name":"Psychology of Moral and Emotional Judgment","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.656840980052948},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6460518836975098},{"id":"https://openalex.org/keywords/theory-of-mind","display_name":"Theory of mind","score":0.5802180171012878},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.571481466293335},{"id":"https://openalex.org/keywords/cognitive-science","display_name":"Cognitive science","score":0.5336993932723999},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5333751440048218},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5330950617790222},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5177223086357117},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.4858819842338562},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.43264082074165344},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.2514686584472656},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.18207570910453796},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.13122692704200745}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.656840980052948},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6460518836975098},{"id":"https://openalex.org/C2779560602","wikidata":"https://www.wikidata.org/wiki/Q639219","display_name":"Theory of mind","level":3,"score":0.5802180171012878},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.571481466293335},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.5336993932723999},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5333751440048218},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5330950617790222},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5177223086357117},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.4858819842338562},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.43264082074165344},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2514686584472656},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.18207570910453796},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.13122692704200745},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/a16020068","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a16020068","pdf_url":"https://www.mdpi.com/1999-4893/16/2/68/pdf?version=1675246431","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:7f0feea4e258439082b9b9d4411ba45b","is_oa":true,"landing_page_url":"https://doaj.org/article/7f0feea4e258439082b9b9d4411ba45b","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Algorithms, Vol 16, Iss 2, p 68 (2023)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/1999-4893/16/2/68/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/a16020068","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Algorithms; Volume 16; Issue 2; Pages: 68","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/a16020068","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a16020068","pdf_url":"https://www.mdpi.com/1999-4893/16/2/68/pdf?version=1675246431","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.699999988079071,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4317609215.pdf"},"referenced_works_count":195,"referenced_works":["https://openalex.org/W46036898","https://openalex.org/W102873864","https://openalex.org/W173318062","https://openalex.org/W1482010531","https://openalex.org/W1533265907","https://openalex.org/W1559990548","https://openalex.org/W1591675293","https://openalex.org/W1652033540","https://openalex.org/W1801976851","https://openalex.org/W1877676982","https://openalex.org/W1975463331","https://openalex.org/W1979863024","https://openalex.org/W1984988829","https://openalex.org/W1999874108","https://openalex.org/W2010931158","https://openalex.org/W2022993718","https://openalex.org/W2023544307","https://openalex.org/W2031485595","https://openalex.org/W2031571562","https://openalex.org/W2032558547","https://openalex.org/W2044155094","https://openalex.org/W2051944318","https://openalex.org/W2069195348","https://openalex.org/W2070469928","https://openalex.org/W2097714468","https://openalex.org/W2098774185","https://openalex.org/W2100401322","https://openalex.org/W2101091849","https://openalex.org/W2102847492","https://openalex.org/W2105325351","https://openalex.org/W2105947986","https://openalex.org/W2106887613","https://openalex.org/W2107258367","https://openalex.org/W2109628722","https://openalex.org/W2113023245","https://openalex.org/W2113475501","https://openalex.org/W2116442740","https://openalex.org/W2117675763","https://openalex.org/W2118944179","https://openalex.org/W2119785746","https://openalex.org/W2124394479","https://openalex.org/W2125392972","https://openalex.org/W2125809125","https://openalex.org/W2127978988","https://openalex.org/W2128662472","https://openalex.org/W2132339352","https://openalex.org/W2133068870","https://openalex.org/W2141538250","https://openalex.org/W2144442672","https://openalex.org/W2145060720","https://openalex.org/W2145162803","https://openalex.org/W2147544021","https://openalex.org/W2151516755","https://openalex.org/W2156163138","https://openalex.org/W2162009473","https://openalex.org/W2162884436","https://openalex.org/W2169498096","https://openalex.org/W2177382477","https://openalex.org/W2180506980","https://openalex.org/W2181849516","https://openalex.org/W2197782092","https://openalex.org/W2211996086","https://openalex.org/W2252983464","https://openalex.org/W2270835334","https://openalex.org/W2275728380","https://openalex.org/W2277630443","https://openalex.org/W2290104316","https://openalex.org/W2323086467","https://openalex.org/W2338865890","https://openalex.org/W2402734324","https://openalex.org/W2404673495","https://openalex.org/W2410842990","https://openalex.org/W2431139695","https://openalex.org/W2466175722","https://openalex.org/W2479202353","https://openalex.org/W2518056776","https://openalex.org/W2525186327","https://openalex.org/W2549684528","https://openalex.org/W2562989799","https://openalex.org/W2567061106","https://openalex.org/W2571600439","https://openalex.org/W2572542433","https://openalex.org/W2572797343","https://openalex.org/W2594035753","https://openalex.org/W2626804490","https://openalex.org/W2740027066","https://openalex.org/W2751530711","https://openalex.org/W2753088790","https://openalex.org/W2758442112","https://openalex.org/W2785648274","https://openalex.org/W2788730383","https://openalex.org/W2793781162","https://openalex.org/W2794908222","https://openalex.org/W2804526344","https://openalex.org/W2806029332","https://openalex.org/W2857457978","https://openalex.org/W2885156179","https://openalex.org/W2891385160","https://openalex.org/W2892806280","https://openalex.org/W2898454860","https://openalex.org/W2909076020","https://openalex.org/W2913781869","https://openalex.org/W2928412166","https://openalex.org/W2939047085","https://openalex.org/W2948198309","https://openalex.org/W2949693231","https://openalex.org/W2949846483","https://openalex.org/W2962845991","https://openalex.org/W2962951365","https://openalex.org/W2963802910","https://openalex.org/W2964460729","https://openalex.org/W2970370999","https://openalex.org/W2971218263","https://openalex.org/W2992873857","https://openalex.org/W2995356893","https://openalex.org/W2997073681","https://openalex.org/W3008082783","https://openalex.org/W3025570388","https://openalex.org/W3027397596","https://openalex.org/W3037298378","https://openalex.org/W3037828308","https://openalex.org/W3046067727","https://openalex.org/W3049574859","https://openalex.org/W3081754649","https://openalex.org/W3087066227","https://openalex.org/W3094369551","https://openalex.org/W3103078873","https://openalex.org/W3107531409","https://openalex.org/W3118793806","https://openalex.org/W3121683757","https://openalex.org/W3122927161","https://openalex.org/W3124088714","https://openalex.org/W3127131455","https://openalex.org/W3130800560","https://openalex.org/W3134762820","https://openalex.org/W3135692815","https://openalex.org/W3137303899","https://openalex.org/W3138984732","https://openalex.org/W3140610361","https://openalex.org/W3162904728","https://openalex.org/W3167325792","https://openalex.org/W3167884978","https://openalex.org/W3169109844","https://openalex.org/W3170234019","https://openalex.org/W3171639171","https://openalex.org/W3175760761","https://openalex.org/W3199495358","https://openalex.org/W3200276130","https://openalex.org/W3204171449","https://openalex.org/W3205751250","https://openalex.org/W3206106208","https://openalex.org/W3206252238","https://openalex.org/W3206298348","https://openalex.org/W4210665702","https://openalex.org/W4210909794","https://openalex.org/W4213206621","https://openalex.org/W4214500342","https://openalex.org/W4223433337","https://openalex.org/W4225737910","https://openalex.org/W4232512588","https://openalex.org/W4246383594","https://openalex.org/W4252518712","https://openalex.org/W4283267980","https://openalex.org/W4283315089","https://openalex.org/W4285079896","https://openalex.org/W4287728432","https://openalex.org/W4291001103","https://openalex.org/W4292919149","https://openalex.org/W4297075189","https://openalex.org/W4298041823","https://openalex.org/W4298112127","https://openalex.org/W4302417474","https://openalex.org/W4309663019","https://openalex.org/W4381162568","https://openalex.org/W6629237864","https://openalex.org/W6634004297","https://openalex.org/W6635919148","https://openalex.org/W6639467748","https://openalex.org/W6645338893","https://openalex.org/W6677712025","https://openalex.org/W6696273291","https://openalex.org/W6718092244","https://openalex.org/W6738860160","https://openalex.org/W6748203849","https://openalex.org/W6750037401","https://openalex.org/W6772059344","https://openalex.org/W6779830860","https://openalex.org/W6796655947","https://openalex.org/W6797408272","https://openalex.org/W6797805595","https://openalex.org/W6797966628","https://openalex.org/W6798788696","https://openalex.org/W6838502310","https://openalex.org/W6903351479","https://openalex.org/W7027153383"],"related_works":["https://openalex.org/W4400868993","https://openalex.org/W3096874164","https://openalex.org/W1985560493","https://openalex.org/W2386410636","https://openalex.org/W2357975469","https://openalex.org/W2145363145","https://openalex.org/W1626977535","https://openalex.org/W4284974072","https://openalex.org/W2341346307","https://openalex.org/W3168977894"],"abstract_inverted_index":{"Theory":[0],"of":[1,102,116,118,151,170,182,189],"mind":[2],"(ToM)":[3],"is":[4,32,99],"the":[5,68,110,152,162,180,186],"psychological":[6,47],"construct":[7],"by":[8,106,142],"which":[9,107],"we":[10,18,53,166],"model":[11],"another\u2019s":[12],"internal":[13],"mental":[14],"states.":[15],"Through":[16],"ToM,":[17,52,138],"adjust":[19],"our":[20,35,92],"own":[21],"behaviour":[22,124],"to":[23,34,51,79,108],"best":[24],"suit":[25],"a":[26,46,100,114,119,127,134,148,168,190],"social":[27,84],"context,":[28],"and":[29,70,157,174,178],"therefore":[30],"it":[31],"essential":[33],"everyday":[36,93],"interactions":[37,85],"with":[38],"others.":[39],"In":[40],"adopting":[41],"an":[42],"algorithmic":[43,187],"(rather":[44],"than":[45],"or":[48],"neurological)":[49],"approach":[50,136],"gain":[54],"insights":[55],"into":[56],"cognition":[57],"that":[58],"will":[59,146],"aid":[60],"us":[61],"in":[62,83,91,126,192],"building":[63],"more":[64,81,89],"accurate":[65],"models":[66],"for":[67,137],"cognitive":[69],"behavioural":[71],"sciences,":[72],"as":[73,75,86,113,139,185],"well":[74],"enable":[76],"artificial":[77],"agents":[78],"be":[80],"proficient":[82],"they":[87],"become":[88],"embedded":[90],"lives.":[94],"Inverse":[95],"reinforcement":[96],"learning":[97,104],"(IRL)":[98],"class":[101],"machine":[103],"methods":[105,160],"infer":[109],"preferences":[111],"(rewards":[112],"function":[115],"state)":[117],"decision":[120,129],"maker":[121],"from":[122],"its":[123],"(trajectories":[125],"Markov":[128],"process).":[130],"IRL":[131,159,172,183],"can":[132],"provide":[133,167],"computational":[135],"recently":[140],"outlined":[141],"Jara-Ettinger,":[143],"but":[144],"this":[145],"require":[147],"better":[149],"understanding":[150],"relationship":[153],"between":[154],"ToM":[155,191],"concepts":[156,184],"existing":[158],"at":[161],"algorthmic":[163],"level.":[164],"Here,":[165],"review":[169],"prominent":[171],"algorithms":[173],"their":[175],"formal":[176],"descriptions,":[177],"discuss":[179],"applicability":[181],"basis":[188],"AI.":[193]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3}],"updated_date":"2026-03-30T08:08:38.191290","created_date":"2025-10-10T00:00:00"}
