{"id":"https://openalex.org/W7162633819","doi":"https://doi.org/10.48550/arxiv.2605.27832","title":"Playing with Words, Improving with Rewards: Training Language Models for Creative Association","display_name":"Playing with Words, Improving with Rewards: Training Language Models for Creative Association","publication_year":2026,"publication_date":"2026-05-27","ids":{"openalex":"https://openalex.org/W7162633819","doi":"https://doi.org/10.48550/arxiv.2605.27832"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.27832","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27832","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.27832","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047400791","display_name":"Vijeta Deshpande","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Deshpande, Vijeta","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137270252","display_name":"Namrata Shivagunde","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shivagunde, Namrata","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080743303","display_name":"Sherin Muckatira","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muckatira, Sherin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137265833","display_name":"Hadrien Glaude","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Glaude, Hadrien","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039290656","display_name":"Mikhail Gronas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gronas, Mikhail","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121221812","display_name":"Claire Stevenson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stevenson, Claire","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137249617","display_name":"Roger Beaty","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Beaty, Roger","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5071360545","display_name":"Anna Rumshisky","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rumshisky, Anna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.3513999879360199,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.3513999879360199,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11079","display_name":"Creativity in Education and Neuroscience","score":0.2084999978542328,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.06430000066757202,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/creativity","display_name":"Creativity","score":0.8870000243186951},{"id":"https://openalex.org/keywords/verifiable-secret-sharing","display_name":"Verifiable secret sharing","score":0.5069000124931335},{"id":"https://openalex.org/keywords/association","display_name":"Association (psychology)","score":0.49959999322891235},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.44369998574256897},{"id":"https://openalex.org/keywords/convergent-thinking","display_name":"Convergent thinking","score":0.3321000039577484}],"concepts":[{"id":"https://openalex.org/C11012388","wikidata":"https://www.wikidata.org/wiki/Q170658","display_name":"Creativity","level":2,"score":0.8870000243186951},{"id":"https://openalex.org/C85847156","wikidata":"https://www.wikidata.org/wiki/Q59015987","display_name":"Verifiable secret sharing","level":3,"score":0.5069000124931335},{"id":"https://openalex.org/C142853389","wikidata":"https://www.wikidata.org/wiki/Q744778","display_name":"Association (psychology)","level":2,"score":0.49959999322891235},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.4706999957561493},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.44369998574256897},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.42660000920295715},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3603000044822693},{"id":"https://openalex.org/C171560490","wikidata":"https://www.wikidata.org/wiki/Q3374857","display_name":"Convergent thinking","level":4,"score":0.3321000039577484},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.3133000135421753},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3098999857902527},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.3084000051021576},{"id":"https://openalex.org/C52641369","wikidata":"https://www.wikidata.org/wiki/Q1426250","display_name":"Creativity technique","level":3,"score":0.27410000562667847},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.2644999921321869},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.2572999894618988}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.27832","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27832","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.27832","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27832","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"are":[4],"being":[5],"applied":[6],"to":[7,23,172],"increasingly":[8],"difficult":[9],"problems":[10],"and":[11,32,65,80,93,96,102,124,169],"use":[12],"cases.":[13],"To":[14],"navigate":[15],"their":[16],"vast":[17],"solution":[18,171],"spaces":[19],"effectively,":[20],"LLMs":[21,40,50,174],"need":[22],"be":[24],"creative.":[25],"Yet":[26],"the":[27,33,58,109,114,122,131,136,155],"subjective":[28],"nature":[29],"of":[30,35,62,133,146],"creativity":[31,42,101,118,143],"limits":[34],"human":[36,78],"judgment":[37,79],"make":[38],"training":[39],"for":[41,175],"especially":[43],"challenging.":[44],"As":[45],"a":[46,53,167],"solution,":[47],"we":[48],"train":[49,81,90,173],"on":[51,99,161],"Codenames,":[52],"word-association":[54],"game":[55],"that":[56,108],"exercises":[57],"two":[59],"central":[60],"axes":[61],"creativity,":[63],"divergent":[64],"convergent":[66],"thinking,":[67],"while":[68,121],"yielding":[69],"objectively":[70],"verifiable":[71],"outcomes.":[72],"This":[73],"verifiability":[74],"lets":[75],"us":[76],"bypass":[77],"with":[82,85,149],"Reinforcement":[83],"Learning":[84],"Verifiable":[86],"Rewards":[87],"(RLVR).":[88],"We":[89,106],"Qwen3-1.7B,":[91],"4B,":[92],"8B":[94,115,137],"models":[95,126,157],"evaluate":[97],"them":[98],"ten":[100],"four":[103],"reasoning":[104,128,152,162],"benchmarks.":[105],"find":[107],"precision-diversity":[110],"trade-off":[111],"is":[112],"scale-dependent:":[113],"model":[116,138],"prioritizes":[117],"over":[119],"precision,":[120],"1.7B":[123],"4B":[125],"gain":[127],"precision":[129],"at":[130],"cost":[132],"creativity.":[134,176],"Concretely,":[135],"shows":[139],"modest":[140],"but":[141],"consistent":[142],"gains":[144,160],"(8":[145],"10":[147],"benchmarks)":[148],"only":[150],"minor":[151],"degradation,":[153],"whereas":[154],"smaller":[156],"achieve":[158],"substantial":[159],"tasks.":[163],"Our":[164],"study":[165],"presents":[166],"scalable":[168],"effective":[170]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-29T00:00:00"}
