{"id":"https://openalex.org/W4381573046","doi":"https://doi.org/10.48550/arxiv.2306.11128","title":"CAMMARL: Conformal Action Modeling in Multi Agent Reinforcement Learning","display_name":"CAMMARL: Conformal Action Modeling in Multi Agent Reinforcement Learning","publication_year":2023,"publication_date":"2023-06-19","ids":{"openalex":"https://openalex.org/W4381573046","doi":"https://doi.org/10.48550/arxiv.2306.11128"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2306.11128","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.11128","pdf_url":"https://arxiv.org/pdf/2306.11128","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2306.11128","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100311114","display_name":"Nikunj Gupta","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Gupta, Nikunj","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032466547","display_name":"Samira Ebrahimi Kahou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nath, Somjit","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Kahou, Samira Ebrahimi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kahou, Samira Ebrahimi","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100311114"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.6543067097663879},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5700756311416626},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5359848737716675},{"id":"https://openalex.org/keywords/conformal-map","display_name":"Conformal map","score":0.5088798999786377},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3523404002189636},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2791960537433624},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.21734905242919922},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.19642430543899536},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.13898488879203796},{"id":"https://openalex.org/keywords/structural-engineering","display_name":"Structural engineering","score":0.1144886314868927},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.07303720712661743}],"concepts":[{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.6543067097663879},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5700756311416626},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5359848737716675},{"id":"https://openalex.org/C98214594","wikidata":"https://www.wikidata.org/wiki/Q850275","display_name":"Conformal map","level":2,"score":0.5088798999786377},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3523404002189636},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2791960537433624},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.21734905242919922},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.19642430543899536},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.13898488879203796},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.1144886314868927},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.07303720712661743},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2306.11128","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.11128","pdf_url":"https://arxiv.org/pdf/2306.11128","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2306.11128","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2306.11128","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2306.11128","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.11128","pdf_url":"https://arxiv.org/pdf/2306.11128","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"score":0.8199999928474426,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588"],"abstract_inverted_index":{"Before":[0],"taking":[1],"actions":[2,55,73],"in":[3,59,62,144,161,174],"an":[4,12,85,107,158],"environment":[5,176],"with":[6,74,136],"more":[7],"than":[8],"one":[9],"intelligent":[10],"agent,":[11],"autonomous":[13,159],"agent":[14,160],"may":[15],"benefit":[16],"from":[17],"reasoning":[18],"about":[19,32],"the":[20,33,36,54,63,94,110,118,133,155,169,175],"other":[21,57,172],"agents":[22,58,173],"and":[23,177],"utilizing":[24,178],"a":[25,28,43,75,128],"notion":[26],"of":[27,35,56,65,96,101,109,157,171],"guarantee":[29],"or":[30],"confidence":[31],"behavior":[34,170],"system.":[37],"In":[38],"this":[39],"article,":[40],"we":[41,92,103,125,150],"propose":[42],"novel":[44],"multi-agent":[45,148],"reinforcement":[46],"learning":[47],"(MARL)":[48],"algorithm":[49],"CAMMARL,":[50],"which":[51],"involves":[52],"modeling":[53,164],"different":[60],"situations":[61],"form":[64],"confident":[66],"sets,":[67,91],"i.e.,":[68],"sets":[69,167],"containing":[70],"their":[71],"true":[72,134],"high":[76,137],"probability.":[77],"We":[78],"then":[79],"use":[80,93],"these":[81],"estimates":[82,180],"to":[83,116,181],"inform":[84],"agent's":[86],"decision-making.":[87],"For":[88,123],"estimating":[89],"such":[90,179],"concept":[95],"conformal":[97,165],"predictions,":[98],"by":[99,163],"means":[100],"which,":[102],"not":[104],"only":[105],"obtain":[106],"estimate":[108],"most":[111],"probable":[112],"outcome":[113],"but":[114],"get":[115],"quantify":[117],"operable":[119],"uncertainty":[120],"as":[121],"well.":[122],"instance,":[124],"can":[126],"predict":[127],"set":[129],"that":[130,152],"provably":[131],"covers":[132],"predictions":[135],"probabilities":[138],"(e.g.,":[139],"95%).":[140],"Through":[141],"several":[142],"experiments":[143],"two":[145],"fully":[146],"cooperative":[147],"tasks,":[149],"show":[151],"CAMMARL":[153],"elevates":[154],"capabilities":[156],"MARL":[162],"prediction":[166],"over":[168],"enhance":[182],"its":[183],"policy":[184],"learning.":[185]},"counts_by_year":[],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
