{"id":"https://openalex.org/W7152391013","doi":"https://doi.org/10.48550/arxiv.2604.07054","title":"Sell More, Play Less: Benchmarking LLM Realistic Selling Skill","display_name":"Sell More, Play Less: Benchmarking LLM Realistic Selling Skill","publication_year":2026,"publication_date":"2026-04-08","ids":{"openalex":"https://openalex.org/W7152391013","doi":"https://doi.org/10.48550/arxiv.2604.07054"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.07054","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07054","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.07054","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084719334","display_name":"Xuanbo Su","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Xuanbo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133294483","display_name":"Wenhao Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Wenhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133240301","display_name":"Le Zhan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Haibo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Chen, Yunzhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yunzhang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhan, Le","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhan, Le","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Yang, Yanqi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yanqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Huang, Leo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Leo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14074","display_name":"Persona Design and Applications","score":0.31119999289512634,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14074","display_name":"Persona Design and Applications","score":0.31119999289512634,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12128","display_name":"AI in Service Interactions","score":0.11400000005960464,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.09279999881982803,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7649999856948853},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.641700029373169},{"id":"https://openalex.org/keywords/mainstream","display_name":"Mainstream","score":0.5891000032424927},{"id":"https://openalex.org/keywords/persuasion","display_name":"Persuasion","score":0.5705999732017517},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5371000170707703},{"id":"https://openalex.org/keywords/rework","display_name":"Rework","score":0.45980000495910645},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.4198000133037567},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.3725000023841858}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7649999856948853},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.641700029373169},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6010000109672546},{"id":"https://openalex.org/C2777617010","wikidata":"https://www.wikidata.org/wiki/Q18957","display_name":"Mainstream","level":2,"score":0.5891000032424927},{"id":"https://openalex.org/C2781310500","wikidata":"https://www.wikidata.org/wiki/Q1231428","display_name":"Persuasion","level":2,"score":0.5705999732017517},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5371000170707703},{"id":"https://openalex.org/C2776543023","wikidata":"https://www.wikidata.org/wiki/Q2147046","display_name":"Rework","level":2,"score":0.45980000495910645},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.4198000133037567},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.3725000023841858},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3707999885082245},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3695000112056732},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3343999981880188},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.3230000138282776},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.32249999046325684},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.32030001282691956},{"id":"https://openalex.org/C1893757","wikidata":"https://www.wikidata.org/wiki/Q3653001","display_name":"Inversion (geology)","level":3,"score":0.31200000643730164},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.30959999561309814},{"id":"https://openalex.org/C2780957164","wikidata":"https://www.wikidata.org/wiki/Q2920188","display_name":"Plain English","level":2,"score":0.30720001459121704},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.2903999984264374},{"id":"https://openalex.org/C58546491","wikidata":"https://www.wikidata.org/wiki/Q1150207","display_name":"Competitive advantage","level":2,"score":0.2883000075817108},{"id":"https://openalex.org/C168725872","wikidata":"https://www.wikidata.org/wiki/Q991663","display_name":"Sophistication","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C2778143727","wikidata":"https://www.wikidata.org/wiki/Q1820650","display_name":"Readability","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.2547999918460846},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.25189998745918274}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.07054","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07054","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.07054","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07054","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.4452991783618927,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Sales":[0],"dialogues":[1],"require":[2],"multi-turn,":[3],"goal-directed":[4],"persuasion":[5],"under":[6],"asymmetric":[7],"incentives,":[8],"which":[9],"makes":[10],"them":[11],"a":[12,34,65,93,153],"challenging":[13],"setting":[14],"for":[15,76,83,156],"large":[16],"language":[17],"models":[18],"(LLMs).":[19],"Yet":[20],"existing":[21],"dialogue":[22],"benchmarks":[23],"rarely":[24],"measure":[25],"deal":[26],"progression":[27],"and":[28,45,53,61,99,158],"outcomes.":[29],"We":[30,63],"introduce":[31],"SalesLLM":[32,114,149],"benchmark,":[33],"bilingual":[35],"(ZH/EN)":[36],"benchmark":[37,115,150,155],"derived":[38],"from":[39,49,109],"realistic":[40],"applications":[41],"covering":[42],"Financial":[43],"Services":[44],"Consumer":[46],"Goods,":[47],"built":[48],"30,074":[50],"scripted":[51],"configurations":[52],"1,805":[54],"curated":[55],"multi-turn":[56],"scenarios":[57],"with":[58,97,119,137],"controllable":[59],"difficulty":[60],"personas.":[62],"propose":[64],"fully":[66],"automatic":[67],"evaluation":[68],"pipeline":[69],"that":[70],"combines":[71],"(i)":[72],"an":[73],"LLM-based":[74],"rater":[75],"sales-process":[77],"progress,and":[78],"(ii)":[79],"fine-tuned":[80],"BERT":[81],"classifiers":[82],"end-of-dialogue":[84],"buying":[85],"intent.":[86],"To":[87],"improve":[88],"simulation":[89],"fidelity,":[90],"we":[91],"train":[92],"user":[94],"model,":[95],"CustomerLM,":[96],"SFT":[98],"DPO":[100],"on":[101],"8,000+":[102],"crowdworker-involved":[103],"sales":[104,161],"conversations,":[105],"reducing":[106],"role":[107],"inversion":[108],"17.44%":[110],"(GPT-4o)":[111],"to":[112],"8.8%.":[113],"scores":[116],"correlate":[117],"strongly":[118],"expert":[120],"human":[121],"ratings":[122],"(Pearson":[123],"r=0.98).":[124],"Experiments":[125],"across":[126],"15":[127],"mainstream":[128],"LLMs":[129,134],"reveal":[130],"substantial":[131],"variability:":[132],"top-performance":[133],"are":[135,145],"competitive":[136],"human-level":[138],"performance":[139],"while":[140],"the":[141],"less":[142],"capable":[143],"ones":[144],"worse":[146],"than":[147],"human.":[148],"serves":[151],"as":[152],"scalable":[154],"developing":[157],"evaluating":[159],"outcome-oriented":[160],"agents.":[162]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-10T00:00:00"}
