{"id":"https://openalex.org/W7133350327","doi":"https://doi.org/10.48550/arxiv.2603.01973","title":"CharacterFlywheel: Scaling Iterative Improvement of Engaging and Steerable LLMs in Production","display_name":"CharacterFlywheel: Scaling Iterative Improvement of Engaging and Steerable LLMs in Production","publication_year":2026,"publication_date":"2026-03-02","ids":{"openalex":"https://openalex.org/W7133350327","doi":"https://doi.org/10.48550/arxiv.2603.01973"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.01973","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01973","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.01973","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066141653","display_name":"Yixin Nie","orcid":"https://orcid.org/0009-0007-2689-7441"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Nie, Yixin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127962331","display_name":"Lin Guan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guan, Lin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127917721","display_name":"Zhongyao Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Zhongyao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081592288","display_name":"Anchit Gupta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gupta, Anchit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127901049","display_name":"Yipin Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Yipin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127926135","display_name":"Xiao Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085639468","display_name":"Zhengping Zhou","orcid":"https://orcid.org/0000-0002-4706-5499"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Zhengping","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127960386","display_name":"Raymond Zeng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zeng, Raymond","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040149588","display_name":"Gelin Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Gelin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043939143","display_name":"Shigan Chu","orcid":"https://orcid.org/0000-0001-7000-1664"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chu, Shigan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017741672","display_name":"Ajay Thampi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Thampi, Ajay","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108817322","display_name":"W. Mu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mu, Wancen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127912402","display_name":"Nathan Shuster","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shuster, Nathan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127952189","display_name":"Ketong Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Ketong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128029460","display_name":"Lin X Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Lin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127944972","display_name":"Jason Brewer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brewer, Jason","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109422222","display_name":"Derek Hao Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Derek Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127928858","display_name":"Alexander McCauley","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"McCauley, Alexander","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124453212","display_name":"Jason Weston","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Weston, Jason","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104310142","display_name":"Sem Park","orcid":"https://orcid.org/0009-0007-9599-5301"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Sem","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127962816","display_name":"Na Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Na","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5127996207","display_name":"Kevin Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Kevin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":22,"corresponding_author_ids":["https://openalex.org/A5066141653"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13194","display_name":"ICT in Developing Communities","score":0.10220000147819519,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13194","display_name":"ICT in Developing Communities","score":0.10220000147819519,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.09880000352859497,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.08460000157356262,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/production","display_name":"Production (economics)","score":0.5462999939918518},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.508400022983551},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.49639999866485596},{"id":"https://openalex.org/keywords/iterative-and-incremental-development","display_name":"Iterative and incremental development","score":0.43529999256134033},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3646000027656555},{"id":"https://openalex.org/keywords/lift","display_name":"Lift (data mining)","score":0.3398999869823456},{"id":"https://openalex.org/keywords/public-engagement","display_name":"Public engagement","score":0.33550000190734863},{"id":"https://openalex.org/keywords/crowdsourcing","display_name":"Crowdsourcing","score":0.31709998846054077}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5663999915122986},{"id":"https://openalex.org/C2778348673","wikidata":"https://www.wikidata.org/wiki/Q739302","display_name":"Production (economics)","level":2,"score":0.5462999939918518},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.508400022983551},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.49639999866485596},{"id":"https://openalex.org/C143587482","wikidata":"https://www.wikidata.org/wiki/Q1543216","display_name":"Iterative and incremental development","level":2,"score":0.43529999256134033},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.36739999055862427},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3646000027656555},{"id":"https://openalex.org/C139002025","wikidata":"https://www.wikidata.org/wiki/Q3001212","display_name":"Lift (data mining)","level":2,"score":0.3398999869823456},{"id":"https://openalex.org/C205112559","wikidata":"https://www.wikidata.org/wiki/Q7257735","display_name":"Public engagement","level":2,"score":0.33550000190734863},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3352000117301941},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.3098999857902527},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.3075000047683716},{"id":"https://openalex.org/C117619785","wikidata":"https://www.wikidata.org/wiki/Q6094414","display_name":"Iterative learning control","level":3,"score":0.30160000920295715},{"id":"https://openalex.org/C67469775","wikidata":"https://www.wikidata.org/wiki/Q304922","display_name":"Social dynamics","level":2,"score":0.30000001192092896},{"id":"https://openalex.org/C2776193868","wikidata":"https://www.wikidata.org/wiki/Q5154950","display_name":"Community engagement","level":2,"score":0.29739999771118164},{"id":"https://openalex.org/C127627568","wikidata":"https://www.wikidata.org/wiki/Q1639361","display_name":"Sociotechnical system","level":2,"score":0.27880001068115234},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27320000529289246},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.267300009727478},{"id":"https://openalex.org/C106246047","wikidata":"https://www.wikidata.org/wiki/Q4928435","display_name":"Iterative design","level":3,"score":0.26460000872612},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.25699999928474426},{"id":"https://openalex.org/C79416737","wikidata":"https://www.wikidata.org/wiki/Q2305519","display_name":"Social learning","level":2,"score":0.2558000087738037},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C2780984029","wikidata":"https://www.wikidata.org/wiki/Q2930198","display_name":"Stakeholder engagement","level":2,"score":0.25529998540878296},{"id":"https://openalex.org/C70118762","wikidata":"https://www.wikidata.org/wiki/Q376934","display_name":"Social engineering (security)","level":2,"score":0.25459998846054077},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.25369998812675476},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.25270000100135803}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.01973","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01973","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.01973","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01973","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0],"report":[1],"presents":[2],"CharacterFlywheel,":[3],"an":[4],"iterative":[5],"flywheel":[6],"process":[7,118],"for":[8,159],"improving":[9],"large":[10],"language":[11],"models":[12,30,67],"(LLMs)":[13],"in":[14,83,88,96,178],"production":[15,164],"social":[16,179],"chat":[17],"applications":[18,180],"across":[19,31],"Instagram,":[20],"WhatsApp,":[21],"and":[22,39,86,106,127,140,143,162,174],"Messenger.":[23],"Starting":[24],"from":[25,36,46,102,110],"LLaMA":[26],"3.1,":[27],"we":[28,52],"refined":[29],"15":[32],"generations":[33],"using":[34],"data":[35,121],"both":[37,141],"internal":[38],"external":[40],"real-user":[41],"traffic.":[42],"Through":[43],"continuous":[44],"deployments":[45],"July":[47],"2024":[48],"to":[49,80,104,112,125,146],"April":[50],"2025,":[51],"conducted":[53],"controlled":[54],"7-day":[55],"A/B":[56],"tests":[57],"showing":[58],"consistent":[59],"engagement":[60,84,89,132],"improvements:":[61],"7":[62],"of":[63,131,176,183],"8":[64],"newly":[65],"deployed":[66],"demonstrated":[68],"positive":[69],"lift":[70],"over":[71],"the":[72,75,116,129,171],"baseline,":[73],"with":[74,98],"strongest":[76],"performers":[77],"achieving":[78],"up":[79],"8.8%":[81],"improvement":[82],"breadth":[85],"19.4%":[87],"depth.":[90],"We":[91,114,154],"also":[92,155],"observed":[93],"substantial":[94],"gains":[95],"steerability,":[97],"instruction":[99,107],"following":[100],"increasing":[101],"59.2%":[103],"84.8%":[105],"violations":[108],"decreasing":[109],"26.6%":[111],"5.8%.":[113],"detail":[115],"CharacterFlywheel":[117],"which":[119],"integrates":[120],"curation,":[122],"reward":[123],"modeling":[124],"estimate":[126],"interpolate":[128],"landscape":[130],"metrics,":[133],"supervised":[134],"fine-tuning":[135],"(SFT),":[136],"reinforcement":[137],"learning":[138],"(RL),":[139],"offline":[142],"online":[144],"evaluation":[145],"ensure":[147],"reliable":[148],"progress":[149],"at":[150,166],"each":[151],"optimization":[152],"step.":[153],"discuss":[156],"our":[157],"methods":[158],"overfitting":[160],"prevention":[161],"navigating":[163],"dynamics":[165],"scale.":[167],"These":[168],"contributions":[169],"advance":[170],"scientific":[172],"rigor":[173],"understanding":[175],"LLMs":[177],"serving":[181],"millions":[182],"users.":[184]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-04T00:00:00"}
