{"id":"https://openalex.org/W4410552403","doi":"https://doi.org/10.1145/3736580","title":"RESIST: Rationale-Enhanced and Reward Model-Based End-to-End Social Influence Dialogue System","display_name":"RESIST: Rationale-Enhanced and Reward Model-Based End-to-End Social Influence Dialogue System","publication_year":2025,"publication_date":"2025-05-21","ids":{"openalex":"https://openalex.org/W4410552403","doi":"https://doi.org/10.1145/3736580"},"language":"en","primary_location":{"id":"doi:10.1145/3736580","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3736580","pdf_url":null,"source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Tong Wu","orcid":"https://orcid.org/0009-0002-5870-4556"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Tong Wu","raw_affiliation_strings":["AHU-IAI AI Joint Laboratory, Anhui University, Hefei, China","AHU-IAI AI Joint Laboratory, Anhui University, China"],"affiliations":[{"raw_affiliation_string":"AHU-IAI AI Joint Laboratory, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]},{"raw_affiliation_string":"AHU-IAI AI Joint Laboratory, Anhui University, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028284977","display_name":"Jinhua Zhu","orcid":"https://orcid.org/0000-0003-2157-9077"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinhua Zhu","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China","University of Science and Technology of China, China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"University of Science and Technology of China, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046805800","display_name":"Wengang Zhou","orcid":"https://orcid.org/0000-0003-1690-9836"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wengang Zhou","raw_affiliation_strings":["EEIS Department, University of Science and Technology of China, Hefei, China","University of Science and Technology of China, China"],"affiliations":[{"raw_affiliation_string":"EEIS Department, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"University of Science and Technology of China, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078141810","display_name":"Houqiang Li","orcid":"https://orcid.org/0000-0003-2188-3028"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Houqiang Li","raw_affiliation_strings":["EEIS Department, University of Science and Technology of China, Hefei, China","University of Science and Technology of China, China"],"affiliations":[{"raw_affiliation_string":"EEIS Department, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"University of Science and Technology of China, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I143868143"],"apc_list":null,"apc_paid":null,"fwci":2.3568,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.89150535,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"21","issue":"6","first_page":"1","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.79941725730896},{"id":"https://openalex.org/keywords/end-to-end-principle","display_name":"End-to-end principle","score":0.7770029306411743},{"id":"https://openalex.org/keywords/end-user","display_name":"End user","score":0.5443410873413086},{"id":"https://openalex.org/keywords/resist","display_name":"Resist","score":0.46030524373054504},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3924132287502289},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.30069345235824585},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.24598601460456848}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.79941725730896},{"id":"https://openalex.org/C74296488","wikidata":"https://www.wikidata.org/wiki/Q2527392","display_name":"End-to-end principle","level":2,"score":0.7770029306411743},{"id":"https://openalex.org/C91262260","wikidata":"https://www.wikidata.org/wiki/Q528074","display_name":"End user","level":2,"score":0.5443410873413086},{"id":"https://openalex.org/C53524968","wikidata":"https://www.wikidata.org/wiki/Q7315582","display_name":"Resist","level":3,"score":0.46030524373054504},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3924132287502289},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30069345235824585},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.24598601460456848},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3736580","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3736580","pdf_url":null,"source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1280917168","display_name":null,"funder_award_id":"623B2097","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W2602753196","https://openalex.org/W2808440041","https://openalex.org/W2952607215","https://openalex.org/W2962852262","https://openalex.org/W2963170138","https://openalex.org/W2979881951","https://openalex.org/W2988937804","https://openalex.org/W3019549080","https://openalex.org/W3116890199","https://openalex.org/W3153184597","https://openalex.org/W3154988854","https://openalex.org/W3170831269","https://openalex.org/W3173710861","https://openalex.org/W3174116563","https://openalex.org/W3210414322","https://openalex.org/W4221143046","https://openalex.org/W4226278401","https://openalex.org/W4285161221","https://openalex.org/W4292779060","https://openalex.org/W4300827275","https://openalex.org/W4309695664","https://openalex.org/W4385569749","https://openalex.org/W4385569870","https://openalex.org/W4385570169","https://openalex.org/W4385570282","https://openalex.org/W4385571411","https://openalex.org/W4385571659","https://openalex.org/W4385571690","https://openalex.org/W4385573018","https://openalex.org/W4385573049","https://openalex.org/W4385763941","https://openalex.org/W4386566904","https://openalex.org/W4389519096","https://openalex.org/W4389520244","https://openalex.org/W4402671642","https://openalex.org/W4402715063","https://openalex.org/W4404525274","https://openalex.org/W6778883912"],"related_works":["https://openalex.org/W4299590256","https://openalex.org/W2151749779","https://openalex.org/W3163634122","https://openalex.org/W2110442089","https://openalex.org/W2166381389","https://openalex.org/W4315785295","https://openalex.org/W4393280045","https://openalex.org/W2054736184","https://openalex.org/W3159728998","https://openalex.org/W2677083173"],"abstract_inverted_index":{"Developing":[0],"proactive":[1,253],"social":[2,88,195],"influence":[3,89,196],"dialogue":[4,34,68,90,115,180,256],"systems":[5],"presents":[6],"a":[7,82,125,151,240,259],"significant":[8],"challenge,":[9],"particularly":[10],"in":[11,66,229],"non-cooperative":[12],"scenarios":[13],"where":[14],"the":[15,23,58,114,138,146,156,177,199,221,252,263,279],"system\u2019s":[16],"goals":[17],"may":[18],"conflict":[19],"with":[20,258,289],"those":[21],"of":[22,60,145,203,209,223,255,266,282],"user.":[24],"Traditional":[25],"methods":[26,228],"often":[27,41],"focus":[28,261],"on":[29,45,193,262],"training":[30,83,205,250],"models":[31,217,269],"to":[32,86,123,136,174,185,246],"plan":[33],"strategies,":[35],"but":[36],"since":[37],"human":[38],"strategies":[39,181],"are":[40,133],"sub-optimal,":[42],"relying":[43],"solely":[44],"manually":[46,165],"collected":[47],"data":[48,139],"can":[49],"be":[50,296],"problematic.":[51],"While":[52],"Large":[53],"Language":[54],"Models":[55],"(LLMs)":[56],"facilitate":[57],"generation":[59],"high-quality":[61],"synthetic":[62],"dialogues,":[63],"their":[64],"effectiveness":[65,200],"strategic":[67,237,280],"under":[69],"zero-shot":[70],"or":[71],"few-shot":[72],"conditions":[73],"is":[74],"inconsistent.":[75],"To":[76,112],"address":[77],"these":[78],"issues,":[79],"we":[80,118,149,170,235],"propose":[81],"framework":[84],"applicable":[85],"multiple":[87],"tasks,":[91],"named":[92],"R":[93,96],"ationale-Enhanced":[94],"and":[95,140,182,188,201,218,232],"eward":[97],"Model-Based":[98],"E":[99],"nd-to-End":[100],"S":[101,106],"ocial":[102],"I":[103],"nfluence":[104],"Dialogue":[105],"ys":[107],"t":[108],"em":[109],"(RESIST)":[110],".":[111],"streamline":[113],"system":[116],"development,":[117],"first":[119],"use":[120],"existing":[121],"datasets":[122],"prompt":[124],"teacher":[126],"LLM":[127],"for":[128],"generating":[129],"\u201cchain-of-thought\u201d":[130],"rationales,":[131],"which":[132],"then":[134],"used":[135],"enrich":[137],"enable":[141],"Supervised":[142],"Fine-Tuning":[143],"(SFT)":[144],"model.":[147],"Next,":[148],"train":[150],"reward":[152],"model":[153],"by":[154],"ranking":[155],"fine-tuned":[157],"model\u2019s":[158],"outputs,":[159],"thereby":[160],"deriving":[161],"task-specific":[162],"preferences":[163],"without":[164],"constructing":[166],"scalar":[167],"rewards.":[168],"Finally,":[169],"apply":[171],"reinforcement":[172],"learning":[173],"further":[175],"refine":[176],"system,":[178],"optimizing":[179],"responses":[183],"according":[184],"specific":[186],"tasks":[187,197],"conversational":[189],"contexts.":[190],"Experimental":[191,273],"results":[192],"three":[194],"demonstrate":[198],"adaptability":[202],"our":[204],"approach.":[206],"In":[207],"terms":[208],"task":[210,271,290],"goal":[211],"completion":[212],",":[213],"RESIST":[214,249,277],"outperforms":[215],"baseline":[216],"even":[219],"exceeds":[220],"performance":[222],"ChatGPT-driven":[224],"prompt-based":[225],"policy":[226],"planning":[227],"both":[230],"efficiency":[231],"effectiveness.":[233],"Additionally,":[234],"introduce":[236],"proactivity":[238,281],"as":[239],"novel":[241],"evaluation":[242],"metric,":[243],"enabling":[244],"us":[245],"analyze":[247],"how":[248],"influences":[251],"traits":[254],"agents,":[257],"particular":[260],"personality":[264],"tendencies":[265],"smaller-scale":[267],"language":[268,283],"during":[270],"execution.":[272],"findings":[274],"indicate":[275],"that":[276],"enhances":[278],"models,":[284],"aligning":[285],"them":[286],"more":[287],"closely":[288],"requirements.":[291],"The":[292],"source":[293],"code":[294],"will":[295],"made":[297],"publicly":[298],"available":[299],"upon":[300],"publication.":[301]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
