{"id":"https://openalex.org/W4416765817","doi":"https://doi.org/10.48550/arxiv.2511.19562","title":"Trust-Based Social Learning for Communication (TSLEC) Protocol Evolution in Multi-Agent Reinforcement Learning","display_name":"Trust-Based Social Learning for Communication (TSLEC) Protocol Evolution in Multi-Agent Reinforcement Learning","publication_year":2025,"publication_date":"2025-11-24","ids":{"openalex":"https://openalex.org/W4416765817","doi":"https://doi.org/10.48550/arxiv.2511.19562"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2511.19562","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.19562","pdf_url":"https://arxiv.org/pdf/2511.19562","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2511.19562","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037956466","display_name":"Abraham Itzhak Weinberg","orcid":"https://orcid.org/0000-0002-2505-9653"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Weinberg, Abraham Itzhak","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5037956466"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.26820001006126404,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.26820001006126404,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.06300000101327896,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11883","display_name":"Embodied and Extended Cognition","score":0.0471000000834465,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.666700005531311},{"id":"https://openalex.org/keywords/social-learning","display_name":"Social learning","score":0.6437000036239624},{"id":"https://openalex.org/keywords/protocol","display_name":"Protocol (science)","score":0.5473999977111816},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5235999822616577},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4277999997138977},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.4203000068664551},{"id":"https://openalex.org/keywords/knowledge-transfer","display_name":"Knowledge transfer","score":0.33180001378059387},{"id":"https://openalex.org/keywords/social-knowledge","display_name":"Social knowledge","score":0.30660000443458557}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.666700005531311},{"id":"https://openalex.org/C79416737","wikidata":"https://www.wikidata.org/wiki/Q2305519","display_name":"Social learning","level":2,"score":0.6437000036239624},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6258000135421753},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.5473999977111816},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5235999822616577},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44179999828338623},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4277999997138977},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.4203000068664551},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.3555999994277954},{"id":"https://openalex.org/C2776960227","wikidata":"https://www.wikidata.org/wiki/Q2586354","display_name":"Knowledge transfer","level":2,"score":0.33180001378059387},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3125},{"id":"https://openalex.org/C2986930172","wikidata":"https://www.wikidata.org/wiki/Q1116133","display_name":"Social knowledge","level":2,"score":0.30660000443458557},{"id":"https://openalex.org/C2983704927","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Social communication","level":2,"score":0.30640000104904175},{"id":"https://openalex.org/C12269588","wikidata":"https://www.wikidata.org/wiki/Q132364","display_name":"Communications protocol","level":2,"score":0.30550000071525574},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.299699991941452},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.29760000109672546},{"id":"https://openalex.org/C130064352","wikidata":"https://www.wikidata.org/wiki/Q853725","display_name":"Social relation","level":2,"score":0.28200000524520874},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.27730000019073486},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.27619999647140503},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.26109999418258667},{"id":"https://openalex.org/C47932503","wikidata":"https://www.wikidata.org/wiki/Q5395689","display_name":"Error-driven learning","level":3,"score":0.2599000036716461},{"id":"https://openalex.org/C131158328","wikidata":"https://www.wikidata.org/wiki/Q1307337","display_name":"Social influence","level":2,"score":0.2556999921798706},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.2513999938964844}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2511.19562","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.19562","pdf_url":"https://arxiv.org/pdf/2511.19562","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2511.19562","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.19562","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2511.19562","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.19562","pdf_url":"https://arxiv.org/pdf/2511.19562","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Emergent":[0,25],"communication":[1,120],"in":[2,11,121],"multi-agent":[3,122],"systems":[4],"typically":[5],"occurs":[6],"through":[7],"independent":[8,73],"learning,":[9],"resulting":[10],"slow":[12],"convergence":[13],"and":[14],"potentially":[15],"suboptimal":[16],"protocols.":[17],"We":[18],"introduce":[19],"TSLEC":[20],"(Trust-Based":[21],"Social":[22],"Learning":[23],"with":[24,37,47,97],"Communication),":[26],"a":[27],"framework":[28],"where":[29],"agents":[30],"explicitly":[31],"teach":[32],"successful":[33],"strategies":[34],"to":[35,72],"peers,":[36],"knowledge":[38,108],"transfer":[39],"modulated":[40],"by":[41,62],"learned":[42],"trust":[43],"relationships.":[44],"Through":[45],"experiments":[46],"100":[48],"episodes":[49],"across":[50],"30":[51],"random":[52],"seeds,":[53],"we":[54],"demonstrate":[55],"that":[56,82,113],"trust-based":[57],"social":[58,115],"learning":[59,116],"reduces":[60],"episodes-to-convergence":[61],"23.9%":[63],"(p":[64],"&lt;":[65,104],"0.001,":[66],"Cohen's":[67],"d":[68],"=":[69,80,101],"1.98)":[70],"compared":[71],"emergence,":[74],"while":[75],"producing":[76],"compositional":[77],"protocols":[78],"(C":[79],"0.38)":[81],"remain":[83],"robust":[84],"under":[85],"dynamic":[86],"objectives":[87],"(Phi":[88],"&gt;":[89],"0.867":[90],"decoding":[91],"accuracy).":[92],"Trust":[93],"scores":[94],"strongly":[95],"correlate":[96],"teaching":[98],"quality":[99],"(r":[100],"0.743,":[102],"p":[103],"0.001),":[105],"enabling":[106],"effective":[107],"filtering.":[109],"Our":[110],"results":[111],"establish":[112],"explicit":[114],"fundamentally":[117],"accelerates":[118],"emergent":[119],"coordination.":[123]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-28T00:00:00"}
