{"id":"https://openalex.org/W4395443699","doi":"https://doi.org/10.48550/arxiv.2404.15058","title":"A Mechanism-Based Approach to Mitigating Harms from Persuasive Generative AI","display_name":"A Mechanism-Based Approach to Mitigating Harms from Persuasive Generative AI","publication_year":2024,"publication_date":"2024-04-23","ids":{"openalex":"https://openalex.org/W4395443699","doi":"https://doi.org/10.48550/arxiv.2404.15058"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2404.15058","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.15058","pdf_url":"https://arxiv.org/pdf/2404.15058","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2404.15058","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016317870","display_name":"Seliem El-Sayed","orcid":"https://orcid.org/0000-0003-4819-1136"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"El-Sayed, Seliem","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095886604","display_name":"Canfer Akbulut","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Akbulut, Canfer","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023716074","display_name":"Amanda McCroskery","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"McCroskery, Amanda","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020476329","display_name":"Geoff Keeling","orcid":"https://orcid.org/0000-0003-3251-4981"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Keeling, Geoff","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069438696","display_name":"Zachary Kenton","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kenton, Zachary","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095886605","display_name":"Zaria Jalan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jalan, Zaria","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036582258","display_name":"Nahema Marchal","orcid":"https://orcid.org/0000-0002-8518-3840"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Marchal, Nahema","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025585747","display_name":"Arianna Manzini","orcid":"https://orcid.org/0000-0001-7710-8974"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manzini, Arianna","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006060802","display_name":"Toby Shevlane","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shevlane, Toby","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076883843","display_name":"Shannon Vallor","orcid":"https://orcid.org/0000-0001-7036-5222"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vallor, Shannon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014693682","display_name":"Daniel Susser","orcid":"https://orcid.org/0000-0003-4534-6200"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Susser, Daniel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030262115","display_name":"Matija Franklin","orcid":"https://orcid.org/0000-0003-1846-8907"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Franklin, Matija","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074597914","display_name":"Sophie Bridgers","orcid":"https://orcid.org/0000-0003-4522-2697"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bridgers, Sophie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073235268","display_name":"Harry Law","orcid":"https://orcid.org/0009-0003-3381-3040"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Law, Harry","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045163381","display_name":"Matthew Rahtz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rahtz, Matthew","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072322524","display_name":"Murray Shanahan","orcid":"https://orcid.org/0000-0001-5984-2964"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shanahan, Murray","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065277725","display_name":"Michael Tessler","orcid":"https://orcid.org/0000-0001-7870-433X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tessler, Michael Henry","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052337951","display_name":"Arthur Douillard","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Douillard, Arthur","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020224050","display_name":"Tom Everitt","orcid":"https://orcid.org/0000-0003-1210-9866"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Everitt, Tom","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5081055990","display_name":"Sasha Brown","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brown, Sasha","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":20,"corresponding_author_ids":["https://openalex.org/A5016317870"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13283","display_name":"Mental Health Research Topics","score":0.8478999733924866,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13283","display_name":"Mental Health Research Topics","score":0.8478999733924866,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.7702999711036682,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.8331780433654785},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.7086004614830017},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3851985037326813},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.3616918921470642},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.3279591500759125},{"id":"https://openalex.org/keywords/cognitive-science","display_name":"Cognitive science","score":0.32322365045547485},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.25513696670532227},{"id":"https://openalex.org/keywords/epistemology","display_name":"Epistemology","score":0.19110289216041565},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.10733595490455627}],"concepts":[{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.8331780433654785},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.7086004614830017},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3851985037326813},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.3616918921470642},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3279591500759125},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.32322365045547485},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25513696670532227},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.19110289216041565},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.10733595490455627}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2404.15058","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.15058","pdf_url":"https://arxiv.org/pdf/2404.15058","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2404.15058","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2404.15058","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2404.15058","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.15058","pdf_url":"https://arxiv.org/pdf/2404.15058","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3760447445","display_name":null,"funder_award_id":"AH/X007146/1","funder_id":"https://openalex.org/F4320334609","funder_display_name":"Arts and Humanities Research Council"}],"funders":[{"id":"https://openalex.org/F4320334609","display_name":"Arts and Humanities Research Council","ror":"https://ror.org/0505m1554"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4395443699.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2380075625","https://openalex.org/W2382997850","https://openalex.org/W2390968135","https://openalex.org/W2382213751","https://openalex.org/W2351750670","https://openalex.org/W1597848696","https://openalex.org/W2354715126","https://openalex.org/W2388563748"],"abstract_inverted_index":{"Recent":[0],"generative":[1,120,127,145],"AI":[2,23,49,65,71,111,169],"systems":[3],"have":[4],"demonstrated":[5],"more":[6],"advanced":[7],"persuasive":[8,119,126],"capabilities":[9],"and":[10,37,51,75,143,155,173,183,222,231],"are":[11,73,78],"increasingly":[12],"permeating":[13],"areas":[14],"of":[15,29,64,70,90,97,110,118,140,152,166,175,191,203,214,238,240],"life":[16],"where":[17],"they":[18,53],"can":[19,54,206],"influence":[20],"decision-making.":[21],"Generative":[22],"presents":[24],"a":[25,61,164,189],"new":[26],"risk":[27],"profile":[28],"persuasion":[30,50,72,91],"due":[31],"the":[32,58,88,95,104,107,233],"opportunity":[33],"for":[34,60,106,219],"reciprocal":[35],"exchange":[36],"prolonged":[38],"interactions.":[39],"This":[40],"has":[41],"led":[42],"to":[43,195,209],"growing":[44],"concerns":[45],"about":[46],"harms":[47,77,86,93,167,213],"from":[48,87,94,168],"how":[52],"be":[55,207],"mitigated,":[56],"highlighting":[57],"need":[59],"systematic":[62,108],"study":[63,109,232],"persuasion.":[66,98,112,197,241],"The":[67],"current":[68],"definitions":[69,117,172],"unclear":[74],"related":[76],"insufficiently":[79],"studied.":[80],"Existing":[81],"harm":[82],"mitigation":[83],"approaches":[84,204],"prioritise":[85],"outcome":[89],"over":[92],"process":[96,212],"In":[99],"this":[100],"paper,":[101],"we":[102,199],"lay":[103],"groundwork":[105],"We":[113,122,160,186],"first":[114],"put":[115,162],"forward":[116,163],"AI.":[121],"distinguish":[123],"between":[124,235],"rationally":[125],"AI,":[128,146],"which":[129,147],"relies":[130,148],"on":[131,149],"providing":[132],"relevant":[133],"facts,":[134],"sound":[135],"reasoning,":[136],"or":[137,157],"other":[138],"forms":[139],"trustworthy":[141],"evidence,":[142],"manipulative":[144],"taking":[150],"advantage":[151],"cognitive":[153],"biases":[154],"heuristics":[156],"misrepresenting":[158],"information.":[159],"also":[161],"map":[165,190],"persuasion,":[170,215],"including":[171,216],"examples":[174],"economic,":[176],"physical,":[177],"environmental,":[178],"psychological,":[179],"sociocultural,":[180],"political,":[181],"privacy,":[182],"autonomy":[184],"harm.":[185],"then":[187],"introduce":[188],"mechanisms":[192,239],"that":[193,205],"contribute":[194],"harmful":[196],"Lastly,":[198],"provide":[200],"an":[201],"overview":[202],"used":[208],"mitigate":[210],"against":[211],"prompt":[217],"engineering":[218],"manipulation":[220],"classification":[221],"red":[223],"teaming.":[224],"Future":[225],"work":[226],"will":[227],"operationalise":[228],"these":[229],"mitigations":[230],"interaction":[234],"different":[236],"types":[237]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-11T14:59:36.786465","created_date":"2025-10-10T00:00:00"}
