{"id":"https://openalex.org/W7161894009","doi":"https://doi.org/10.48550/arxiv.2605.20087","title":"ThoughtTrace: Understanding User Thoughts in Real-World LLM Interactions","display_name":"ThoughtTrace: Understanding User Thoughts in Real-World LLM Interactions","publication_year":2026,"publication_date":"2026-05-19","ids":{"openalex":"https://openalex.org/W7161894009","doi":"https://doi.org/10.48550/arxiv.2605.20087"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.20087","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20087","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.20087","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136581425","display_name":"Chuanyang Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Chuanyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136535414","display_name":"Binze Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Binze","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136562466","display_name":"Haopeng Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Haopeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061556449","display_name":"Cathy Mengying Fang","orcid":"https://orcid.org/0000-0003-4684-7058"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Cathy Mengying","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136570185","display_name":"Tianjian Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Tianjian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001884064","display_name":"Shayne Longpre","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Longpre, Shayne","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136604598","display_name":"Hongxiang Gu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gu, Hongxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063752328","display_name":"Maximillian Chen","orcid":"https://orcid.org/0000-0003-4374-9110"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Maximillian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5005908625","display_name":"Tianmin Shu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shu, Tianmin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12128","display_name":"AI in Service Interactions","score":0.5468000173568726,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12128","display_name":"AI in Service Interactions","score":0.5468000173568726,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.07919999957084656,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.0723000019788742,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.6446999907493591},{"id":"https://openalex.org/keywords/conversation-analysis","display_name":"Conversation analysis","score":0.44850000739097595},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.43959999084472656},{"id":"https://openalex.org/keywords/frontier","display_name":"Frontier","score":0.42820000648498535},{"id":"https://openalex.org/keywords/dynamics","display_name":"Dynamics (music)","score":0.3619000017642975},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.36039999127388},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.34209999442100525}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6470000147819519},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.6446999907493591},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.47859999537467957},{"id":"https://openalex.org/C2780829048","wikidata":"https://www.wikidata.org/wiki/Q1624720","display_name":"Conversation analysis","level":3,"score":0.44850000739097595},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.43959999084472656},{"id":"https://openalex.org/C2778571376","wikidata":"https://www.wikidata.org/wiki/Q1355821","display_name":"Frontier","level":2,"score":0.42820000648498535},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.4169999957084656},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.36469998955726624},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.3619000017642975},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.36039999127388},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.34209999442100525},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3352999985218048},{"id":"https://openalex.org/C173853756","wikidata":"https://www.wikidata.org/wiki/Q86915","display_name":"Dialog box","level":2,"score":0.31450000405311584},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.31189998984336853},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.310699999332428},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.29120001196861267},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.2870999872684479},{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.28630000352859497},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.2728999853134155},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C2983448237","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Language understanding","level":2,"score":0.260699987411499},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.2563999891281128},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.25450000166893005},{"id":"https://openalex.org/C67712803","wikidata":"https://www.wikidata.org/wiki/Q7901853","display_name":"User modeling","level":3,"score":0.2531000077724457}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.20087","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20087","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.20087","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20087","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6046368479728699}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Conversational":[0],"AI":[1],"has":[2],"now":[3],"reached":[4],"billions":[5],"of":[6,103],"users,":[7,50],"yet":[8],"existing":[9],"datasets":[10],"capture":[11],"only":[12],"what":[13,17],"people":[14],"say,":[15],"not":[16],"they":[18],"think.":[19],"We":[20,98],"introduce":[21],"ThoughtTrace,":[22],"the":[23,101,139],"first":[24],"large-scale":[25],"dataset":[26],"that":[27,67,75,152],"pairs":[28],"real-world":[29],"multi-turn":[30],"human--AI":[31,143],"conversations":[32],"with":[33],"users'":[34,158],"self-reported":[35],"thoughts:":[36],"their":[37],"reasons":[38],"for":[39,83,105,123,137,149],"sending":[40],"prompts":[41],"and":[42,55,74,93,145,155,162],"reactions":[43],"to":[44,86,95,157],"assistant":[45],"responses.":[46],"ThoughtTrace":[47,68,128],"comprises":[48],"1,058":[49],"2,155":[51],"conversations,":[52],"17,058":[53],"turns,":[54],"10,174":[56],"thought":[57],"annotations":[58],"collected":[59],"across":[60],"20":[61],"language":[62],"models.":[63],"Our":[64],"analysis":[65],"shows":[66],"captures":[69],"long-horizon,":[70],"topically":[71],"diverse":[72,90],"interactions,":[73],"thoughts":[76,104,109,131],"are":[77],"semantically":[78],"distinct":[79],"from":[80,88],"messages,":[81],"difficult":[82],"frontier":[84],"LLMs":[85],"infer":[87],"context,":[89],"in":[91],"content,":[92],"tied":[94],"conversation":[96],"stages.":[97],"further":[99],"demonstrate":[100],"utility":[102],"downstream":[106],"modeling.":[107],"First,":[108],"improve":[110],"user-behavior":[111],"prediction":[112],"as":[113,132],"inference-time":[114],"context.":[115],"Second,":[116],"thought-guided":[117],"rewrites":[118],"provide":[119],"fine-grained":[120],"alignment":[121],"signals":[122],"training":[124],"personalized":[125],"assistants.":[126],"Together,":[127],"establishes":[129],"user":[130],"a":[133,147],"new":[134],"data":[135],"modality":[136],"studying":[138],"cognitive":[140],"dynamics":[141],"behind":[142],"interaction":[144],"provides":[146],"foundation":[148],"building":[150],"assistants":[151],"better":[153],"understand":[154],"adapt":[156],"latent":[159],"goals,":[160],"preferences,":[161],"needs.":[163]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-21T00:00:00"}
