{"id":"https://openalex.org/W7129539100","doi":"https://doi.org/10.48550/arxiv.2602.15012","title":"Cold-Start Personalization via Training-Free Priors from Structured World Models","display_name":"Cold-Start Personalization via Training-Free Priors from Structured World Models","publication_year":2026,"publication_date":"2026-02-16","ids":{"openalex":"https://openalex.org/W7129539100","doi":"https://doi.org/10.48550/arxiv.2602.15012"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.15012","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126203386","display_name":"Avinandan Bose","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bose, Avinandan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022934996","display_name":"Shuyue Stella Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Shuyue Stella","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126223025","display_name":"Faeze Brahman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brahman, Faeze","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126237414","display_name":"Pang Wei Koh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koh, Pang Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033061754","display_name":"Simon S. Du","orcid":"https://orcid.org/0000-0003-0056-8299"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Simon Shaolei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114482527","display_name":"Yulia Tsvetkov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tsvetkov, Yulia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102886973","display_name":"Maryam Fazel","orcid":"https://orcid.org/0000-0001-5329-4522"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fazel, Maryam","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126175926","display_name":"Lin Xiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Lin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126244245","display_name":"Asli Celikyilmaz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Celikyilmaz, Asli","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5126203386"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.1842000037431717,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.1842000037431717,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1462000012397766,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.06930000334978104,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6870999932289124},{"id":"https://openalex.org/keywords/preference-learning","display_name":"Preference learning","score":0.6516000032424927},{"id":"https://openalex.org/keywords/preference-elicitation","display_name":"Preference elicitation","score":0.6313999891281128},{"id":"https://openalex.org/keywords/preference","display_name":"Preference","score":0.6053000092506409},{"id":"https://openalex.org/keywords/bayesian-network","display_name":"Bayesian network","score":0.5823000073432922},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5631999969482422},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5386999845504761},{"id":"https://openalex.org/keywords/personalization","display_name":"Personalization","score":0.5371000170707703},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.47200000286102295}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7024000287055969},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6870999932289124},{"id":"https://openalex.org/C181204326","wikidata":"https://www.wikidata.org/wiki/Q7239820","display_name":"Preference learning","level":3,"score":0.6516000032424927},{"id":"https://openalex.org/C2777868144","wikidata":"https://www.wikidata.org/wiki/Q7239817","display_name":"Preference elicitation","level":3,"score":0.6313999891281128},{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.6053000092506409},{"id":"https://openalex.org/C33724603","wikidata":"https://www.wikidata.org/wiki/Q812540","display_name":"Bayesian network","level":2,"score":0.5823000073432922},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5691999793052673},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5631999969482422},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5386999845504761},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.5371000170707703},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5009999871253967},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.47200000286102295},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.4657999873161316},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.45489999651908875},{"id":"https://openalex.org/C155846161","wikidata":"https://www.wikidata.org/wiki/Q1143367","display_name":"Graphical model","level":2,"score":0.45210000872612},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.4424999952316284},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.42640000581741333},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.39340001344680786},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.3806000053882599},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.375900000333786},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.3682999908924103},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.27410000562667847},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.2734000086784363},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2635999917984009},{"id":"https://openalex.org/C73602740","wikidata":"https://www.wikidata.org/wiki/Q7795822","display_name":"Thompson sampling","level":3,"score":0.2583000063896179},{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.251800000667572}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.15012","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.15012","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.15012","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.15012","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Cold-start":[0],"personalization":[1],"requires":[2,155],"inferring":[3],"user":[4,95],"preferences":[5,177],"through":[6],"interaction":[7],"when":[8],"no":[9],"user-specific":[10],"historical":[11],"data":[12],"is":[13,18,44,62,149,225],"available.":[14],"The":[15,147],"core":[16],"challenge":[17],"a":[19,35,47,116],"routing":[20],"problem:":[21],"each":[22],"task":[23],"admits":[24],"dozens":[25],"of":[26,80,120,201,233],"preference":[27,81,121,140,234],"dimensions,":[28],"yet":[29],"individual":[30],"users":[31,188],"care":[32],"about":[33],"only":[34,156],"few,":[36],"and":[37,83,106,137,154,164,174],"which":[38],"ones":[39],"matter":[40],"depends":[41],"on":[42],"who":[43],"asking.":[45],"With":[46],"limited":[48],"question":[49,91],"budget,":[50],"asking":[51],"without":[52],"structure":[53,79,104,232],"will":[54],"miss":[55],"the":[56,63,76,193,202,220,226,230],"dimensions":[57,143],"that":[58,93,219],"matter.":[59],"Reinforcement":[60],"learning":[61,105],"natural":[64],"formulation,":[65],"but":[66],"in":[67,84,222],"multi-turn":[68],"settings":[69],"its":[70,198],"terminal":[71],"reward":[72],"fails":[73],"to":[74,89,133,192,228],"exploit":[75,229],"factored,":[77],"per-criterion":[78],"data,":[82],"practice":[85],"learned":[86],"policies":[87],"collapse":[88],"static":[90],"sequences":[92],"ignore":[94],"responses.":[96],"We":[97],"propose":[98],"decomposing":[99],"cold-start":[100,223],"elicitation":[101,224],"into":[102],"offline":[103,123],"online":[107,132],"Bayesian":[108,130],"inference.":[109],"Pep":[110,167,196],"(Preference":[111],"Elicitation":[112],"with":[113,182,211],"Priors)":[114],"learns":[115],"structured":[117],"world":[118],"model":[119],"correlations":[122],"from":[124],"complete":[125,139],"profiles,":[126,141],"then":[127],"performs":[128],"training-free":[129],"inference":[131],"select":[134],"informative":[135],"questions":[136],"predict":[138],"including":[142],"never":[144],"asked":[145],"about.":[146],"framework":[148],"modular":[150],"across":[151],"downstream":[152],"solvers":[153],"simple":[157],"belief":[158],"models.":[159],"Across":[160],"medical,":[161],"mathematical,":[162],"social,":[163],"commonsense":[165],"reasoning,":[166],"achieves":[168],"80.8%":[169],"alignment":[170],"between":[171],"generated":[172],"responses":[173],"users'":[175],"stated":[176],"versus":[178,204,214],"68.5%":[179],"for":[180,206,216],"RL,":[181,217],"3-5x":[183],"fewer":[184],"interactions.":[185],"When":[186],"two":[187],"give":[189],"different":[190],"answers":[191],"same":[194],"question,":[195],"changes":[197],"follow-up":[199],"39-62%":[200],"time":[203],"0-28%":[205],"RL.":[207],"It":[208],"does":[209],"so":[210],"~10K":[212],"parameters":[213],"8B":[215],"showing":[218],"bottleneck":[221],"capability":[227],"factored":[231],"data.":[235]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-18T00:00:00"}
