{"id":"https://openalex.org/W4400434131","doi":"https://doi.org/10.48550/arxiv.2407.03884","title":"ChatSOP: An SOP-Guided MCTS Planning Framework for Controllable LLM Dialogue Agents","display_name":"ChatSOP: An SOP-Guided MCTS Planning Framework for Controllable LLM Dialogue Agents","publication_year":2024,"publication_date":"2024-07-04","ids":{"openalex":"https://openalex.org/W4400434131","doi":"https://doi.org/10.48550/arxiv.2407.03884"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2407.03884","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.03884","pdf_url":"https://arxiv.org/pdf/2407.03884","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2407.03884","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113281905","display_name":"Zhigen Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Zhigen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101394599","display_name":"Jianxiang Peng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Jianxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101856072","display_name":"Yanmeng Wang","orcid":"https://orcid.org/0000-0002-5423-0990"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yanmeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Cao, Yong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Yong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101285252","display_name":"Tianhao Shen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Tianhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100419543","display_name":"Minghui Zhang","orcid":"https://orcid.org/0000-0002-7102-7505"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Minghui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101245112","display_name":"Linxi Su","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Linxi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110367017","display_name":"Shang Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Shang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055916281","display_name":"Yihang Wu","orcid":"https://orcid.org/0000-0002-8640-8650"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Yihang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100751794","display_name":"Yuqian Wang","orcid":"https://orcid.org/0000-0003-3755-0586"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yuqian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100423435","display_name":"Ye Wang","orcid":"https://orcid.org/0000-0002-0123-1260"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Ye","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100727084","display_name":"Wei Hu","orcid":"https://orcid.org/0000-0003-3635-6335"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100462038","display_name":"Jianfeng Li","orcid":"https://orcid.org/0000-0003-4055-7017"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jianfeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100702017","display_name":"Shaojun Wang","orcid":"https://orcid.org/0009-0001-8955-8566"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Shaojun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101931947","display_name":"Jing Xiao","orcid":"https://orcid.org/0000-0001-6141-677X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Jing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5055232825","display_name":"Deyi Xiong","orcid":"https://orcid.org/0000-0002-2353-5038"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiong, Deyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":16,"corresponding_author_ids":["https://openalex.org/A5113281905"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9821000099182129,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9706000089645386,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6555946469306946},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.41244786977767944},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.34432828426361084},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.05853322148323059}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6555946469306946},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41244786977767944},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.34432828426361084},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.05853322148323059}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2407.03884","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.03884","pdf_url":"https://arxiv.org/pdf/2407.03884","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2407.03884","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2407.03884","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2407.03884","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2407.03884","pdf_url":"https://arxiv.org/pdf/2407.03884","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4400434131.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"Dialogue":[0],"agents":[1],"powered":[2],"by":[3],"Large":[4],"Language":[5],"Models":[6],"(LLMs)":[7],"show":[8],"superior":[9],"performance":[10],"in":[11,145],"various":[12],"tasks.":[13],"Despite":[14],"the":[15,68,134],"better":[16],"user":[17],"understanding":[18],"and":[19,93,118,155,164],"human-like":[20],"responses,":[21],"their":[22],"**lack":[23],"of":[24,70,109,136],"controllability**":[25],"remains":[26],"a":[27,55,79,87,103,142],"key":[28],"challenge,":[29],"often":[30],"leading":[31],"to":[32,47,66,149],"unfocused":[33],"conversations":[34],"or":[35],"task":[36],"failure.":[37],"To":[38,74],"address":[39],"this,":[40,76],"we":[41,52,77,101],"introduce":[42],"Standard":[43],"Operating":[44],"Procedure":[45],"(SOP)":[46],"regulate":[48],"dialogue":[49,72],"flow.":[50],"Specifically,":[51],"propose":[53,102],"**ChatSOP**,":[54],"novel":[56,104],"SOP-guided":[57,120],"Monte":[58,121],"Carlo":[59,122],"Tree":[60,123],"Search":[61,124],"(MCTS)":[62],"planning":[63,128],"framework":[64],"designed":[65],"enhance":[67],"controllability":[69],"LLM-driven":[71],"agents.":[73],"enable":[75],"curate":[78],"dataset":[80],"comprising":[81],"SOP-annotated":[82],"multi-scenario":[83],"dialogues,":[84],"generated":[85],"using":[86],"semi-automated":[88],"role-playing":[89],"system":[90],"with":[91,112],"GPT-4o":[92],"validated":[94],"through":[95],"strict":[96],"manual":[97],"quality":[98],"control.":[99],"Additionally,":[100],"method":[105],"that":[106],"integrates":[107],"Chain":[108],"Thought":[110],"reasoning":[111],"supervised":[113],"fine-tuning":[114],"for":[115,125,160],"SOP":[116],"prediction":[117],"utilizes":[119],"optimal":[126],"action":[127,146],"during":[129],"dialogues.":[130],"Experimental":[131],"results":[132],"demonstrate":[133],"effectiveness":[135],"our":[137],"method,":[138],"such":[139],"as":[140],"achieving":[141],"27.95%":[143],"improvement":[144],"accuracy":[147],"compared":[148],"baseline":[150],"models":[151],"based":[152],"on":[153],"GPT-3.5":[154],"also":[156],"showing":[157],"notable":[158],"gains":[159],"open-source":[161],"models.":[162],"Dataset":[163],"codes":[165],"are":[166],"publicly":[167],"available.":[168]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-05T09:01:59.212387","created_date":"2024-07-09T00:00:00"}
