{"id":"https://openalex.org/W7118022708","doi":"https://doi.org/10.48550/arxiv.2512.25063","title":"Many Minds from One Model: Bayesian-Inspired Transformers for Population Diversity","display_name":"Many Minds from One Model: Bayesian-Inspired Transformers for Population Diversity","publication_year":2025,"publication_date":"2025-12-31","ids":{"openalex":"https://openalex.org/W7118022708","doi":"https://doi.org/10.48550/arxiv.2512.25063"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.25063","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.25063","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.25063","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037401289","display_name":"Diji Yang","orcid":"https://orcid.org/0009-0005-1591-4846"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yang, Diji","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5121834288","display_name":"Yi Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yi","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5037401289"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.17749999463558197,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.17749999463558197,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1598999947309494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.13570000231266022,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.5142999887466431},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.4909000098705292},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.4702000021934509},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.4578999876976013},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4171999990940094},{"id":"https://openalex.org/keywords/bayesian-inference","display_name":"Bayesian inference","score":0.40139999985694885},{"id":"https://openalex.org/keywords/normalization","display_name":"Normalization (sociology)","score":0.3617999851703644}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6051999926567078},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.570900022983551},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5681999921798706},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.5142999887466431},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.4909000098705292},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.4702000021934509},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.4578999876976013},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4171999990940094},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.40139999985694885},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.3617999851703644},{"id":"https://openalex.org/C207201462","wikidata":"https://www.wikidata.org/wiki/Q182505","display_name":"Bayes' theorem","level":3,"score":0.3147999942302704},{"id":"https://openalex.org/C521332185","wikidata":"https://www.wikidata.org/wiki/Q185816","display_name":"Analogy","level":2,"score":0.30959999561309814},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.29840001463890076},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.2838999927043915},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.28189998865127563},{"id":"https://openalex.org/C85847156","wikidata":"https://www.wikidata.org/wiki/Q59015987","display_name":"Verifiable secret sharing","level":3,"score":0.25920000672340393},{"id":"https://openalex.org/C101112237","wikidata":"https://www.wikidata.org/wiki/Q4874481","display_name":"Bayesian statistics","level":4,"score":0.25699999928474426},{"id":"https://openalex.org/C52740198","wikidata":"https://www.wikidata.org/wiki/Q1539564","display_name":"Importance sampling","level":3,"score":0.25290000438690186}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.25063","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.25063","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.25063","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.25063","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7760249972343445,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Despite":[0],"their":[1],"scale":[2],"and":[3,126,133,140],"success,":[4],"modern":[5],"transformers":[6],"are":[7],"usually":[8],"trained":[9],"as":[10,64],"single-minded":[11],"systems:":[12],"optimization":[13],"produces":[14],"a":[15,21,65,68,74,100,119],"deterministic":[16,167],"set":[17],"of":[18,89,102,114],"parameters,":[19],"representing":[20],"single":[22,69,120],"functional":[23],"hypothesis":[24],"about":[25],"the":[26,30,86,112,123,152],"data.":[27],"Motivated":[28],"by":[29,78],"analogy":[31],"to":[32,63,166],"human":[33],"populations,":[34],"in":[35],"which":[36,50],"population-level":[37],"intelligence":[38],"emerges":[39],"from":[40,67,96,122],"diverse":[41,53,105],"individual":[42],"behaviors,":[43],"we":[44,117],"propose":[45],"Population":[46],"Bayesian":[47,92],"Transformers":[48],"(B-Trans),":[49],"enable":[51],"sampling":[52],"yet":[54],"coherent":[55],"transformer":[56],"large":[57],"language":[58],"model":[59,154],"instances":[60],"(hereafter":[61],"referred":[62],"'mind')":[66],"pre-trained":[70],"LLM.":[71],"B-Trans":[72,149],"introduces":[73],"Bayesian-inspired":[75],"posterior":[76],"proxy":[77,98],"injecting":[79],"stochasticity":[80],"directly":[81],"into":[82],"normalization":[83],"layers,":[84],"avoiding":[85],"prohibitive":[87],"cost":[88],"training":[90],"full":[91],"neural":[93],"networks.":[94],"Sampling":[95],"this":[97],"yields":[99],"population":[101],"minds":[103],"with":[104,143],"behaviors":[106],"while":[107,160],"maintaining":[108],"general":[109],"competence.":[110],"During":[111],"generation":[113,139],"each":[115],"response,":[116],"sample":[118],"realization":[121],"random":[124],"distribution":[125],"hold":[127],"it":[128],"fixed,":[129],"ensuring":[130],"temporal":[131],"consistency":[132],"reasoning":[134],"coherence.":[135],"Experiments":[136],"on":[137],"zero-shot":[138],"Reinforcement":[141],"Learning":[142],"Verifiable":[144],"Rewards":[145],"(RLVR)":[146],"demonstrate":[147],"that":[148],"effectively":[150],"leverages":[151],"stochastic":[153],"diversity,":[155],"yielding":[156],"superior":[157],"response":[158],"diversity":[159],"achieving":[161],"better":[162],"task":[163],"performance":[164],"compared":[165],"baselines.":[168]},"counts_by_year":[],"updated_date":"2026-01-20T17:24:06.736184","created_date":"2026-01-02T00:00:00"}
