{"id":"https://openalex.org/W3119430426","doi":"https://doi.org/10.1109/tcyb.2020.3041265","title":"Frame-Correlation Transfers Trigger Economical Attacks on Deep Reinforcement Learning Policies","display_name":"Frame-Correlation Transfers Trigger Economical Attacks on Deep Reinforcement Learning Policies","publication_year":2021,"publication_date":"2021-01-09","ids":{"openalex":"https://openalex.org/W3119430426","doi":"https://doi.org/10.1109/tcyb.2020.3041265","mag":"3119430426","pmid":"https://pubmed.ncbi.nlm.nih.gov/33417576"},"language":"en","primary_location":{"id":"doi:10.1109/tcyb.2020.3041265","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2020.3041265","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048340011","display_name":"Xinghua Qu","orcid":"https://orcid.org/0000-0001-8072-2019"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Xinghua Qu","raw_affiliation_strings":["Computational Intelligence Lab, School of Computer Science and Engineering, Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0000-0001-8072-2019","affiliations":[{"raw_affiliation_string":"Computational Intelligence Lab, School of Computer Science and Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068243197","display_name":"Yew-Soon Ong","orcid":"https://orcid.org/0000-0002-4480-169X"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]},{"id":"https://openalex.org/I4210091207","display_name":"Singapore Institute of Manufacturing Technology","ror":"https://ror.org/00f44np30","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I4210091207","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yew-Soon Ong","raw_affiliation_strings":["Data Science and Artificial Intelligence Research Centre, School of Computer Science and Engineering, Nanyang Technological University, Singapore","Singtel Cognitive and Artificial Intelligence Lab for Enterprises, Nanyang Technological University, Singapore","Singapore Institute of Manufacturing Technology (SIMTech), Agency for Science, Technology and Research, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-4480-169X","affiliations":[{"raw_affiliation_string":"Data Science and Artificial Intelligence Research Centre, School of Computer Science and Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]},{"raw_affiliation_string":"Singtel Cognitive and Artificial Intelligence Lab for Enterprises, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]},{"raw_affiliation_string":"Singapore Institute of Manufacturing Technology (SIMTech), Agency for Science, Technology and Research, Singapore","institution_ids":["https://openalex.org/I4210091207","https://openalex.org/I115228651"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5041091856","display_name":"Abhishek Gupta","orcid":"https://orcid.org/0000-0002-6080-855X"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I4210091207","display_name":"Singapore Institute of Manufacturing Technology","ror":"https://ror.org/00f44np30","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I4210091207","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Abhishek Gupta","raw_affiliation_strings":["Singapore Institute of Manufacturing Technology (SIMTech), Agency for Science, Technology and Research, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-6080-855X","affiliations":[{"raw_affiliation_string":"Singapore Institute of Manufacturing Technology (SIMTech), Agency for Science, Technology and Research, Singapore","institution_ids":["https://openalex.org/I4210091207","https://openalex.org/I115228651"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.9591,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.88267345,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"52","issue":"8","first_page":"7577","last_page":"7590"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9563999772071838,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9139000177383423,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8019753694534302},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7698001265525818},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5689079761505127},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5653186440467834},{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.5142126083374023},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.5057942867279053},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.48388704657554626},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.4589991569519043},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.4484354853630066},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.4388892352581024},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3669859766960144},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.34756046533584595},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.2968684136867523},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1633196473121643}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8019753694534302},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7698001265525818},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5689079761505127},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5653186440467834},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.5142126083374023},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.5057942867279053},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.48388704657554626},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.4589991569519043},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.4484354853630066},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.4388892352581024},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3669859766960144},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.34756046533584595},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.2968684136867523},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1633196473121643},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008390","descriptor_name":"Markov Chains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008390","descriptor_name":"Markov Chains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008390","descriptor_name":"Markov Chains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D057766","descriptor_name":"Policy","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D057766","descriptor_name":"Policy","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D057766","descriptor_name":"Policy","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1109/tcyb.2020.3041265","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2020.3041265","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},{"id":"pmid:33417576","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/33417576","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on cybernetics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.8100000023841858}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320766","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":57,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1573357502","https://openalex.org/W1673923490","https://openalex.org/W1945616565","https://openalex.org/W2019683663","https://openalex.org/W2053171205","https://openalex.org/W2088658556","https://openalex.org/W2089497633","https://openalex.org/W2090898720","https://openalex.org/W2112604022","https://openalex.org/W2121601095","https://openalex.org/W2125696348","https://openalex.org/W2160553465","https://openalex.org/W2170015254","https://openalex.org/W2178155017","https://openalex.org/W2257979135","https://openalex.org/W2538642367","https://openalex.org/W2559655401","https://openalex.org/W2586101872","https://openalex.org/W2612690371","https://openalex.org/W2736601468","https://openalex.org/W2746600820","https://openalex.org/W2770581177","https://openalex.org/W2782802862","https://openalex.org/W2888985868","https://openalex.org/W2904169782","https://openalex.org/W2904346582","https://openalex.org/W2908261578","https://openalex.org/W2919115771","https://openalex.org/W2941205169","https://openalex.org/W2949103145","https://openalex.org/W2963857521","https://openalex.org/W2966266966","https://openalex.org/W2968800863","https://openalex.org/W2969419629","https://openalex.org/W2972188071","https://openalex.org/W2973229164","https://openalex.org/W2981862084","https://openalex.org/W2983044655","https://openalex.org/W2986196668","https://openalex.org/W3003303990","https://openalex.org/W3007869767","https://openalex.org/W3041719080","https://openalex.org/W3047311022","https://openalex.org/W3049461753","https://openalex.org/W3092202606","https://openalex.org/W3094604376","https://openalex.org/W3106412272","https://openalex.org/W3163399111","https://openalex.org/W4250503569","https://openalex.org/W4293846201","https://openalex.org/W4298857966","https://openalex.org/W6638018090","https://openalex.org/W6692846177","https://openalex.org/W6730269975","https://openalex.org/W6743802245","https://openalex.org/W6780143859"],"related_works":["https://openalex.org/W3096874164","https://openalex.org/W2937181779","https://openalex.org/W2386410636","https://openalex.org/W1985560493","https://openalex.org/W2357975469","https://openalex.org/W2145363145","https://openalex.org/W1626977535","https://openalex.org/W4284974072","https://openalex.org/W2341346307","https://openalex.org/W4225269853"],"abstract_inverted_index":{"Adversarial":[0],"attack":[1,197],"can":[2],"be":[3,57,117],"deemed":[4],"as":[5],"a":[6,58,77,163],"necessary":[7],"prerequisite":[8],"evaluation":[9],"procedure":[10],"before":[11],"the":[12,71,96,103,108,121,169,172,177,196,205,216],"deployment":[13],"of":[14,37,76,111,123,138,156,176,219],"any":[15],"reinforcement":[16],"learning":[17],"(RL)":[18],"policy.":[19],"Most":[20],"existing":[21,201],"approaches":[22],"for":[23,119],"generating":[24,160],"adversarial":[25],"attacks":[26,64,127,221],"are":[27,31],"gradient":[28],"based":[29],"and":[30,54,149,174],"extensive,":[32],"viz.,":[33],"perturbing":[34],"every":[35,38,66],"pixel":[36],"frame.":[39],"In":[40],"contrast,":[41],"recent":[42],"advances":[43],"show":[44],"that":[45,87],"gradient-free":[46],"selective":[47],"perturbations":[48],"(i.e.,":[49,142],"attacking":[50],"only":[51],"selected":[52],"pixels":[53],"frames)":[55],"could":[56,116],"more":[59],"realistic":[60],"adversary.":[61],"However,":[62],"these":[63],"treat":[65],"frame":[67],"in":[68,83,100,128,159,222],"isolation,":[69],"ignoring":[70],"relationship":[72],"between":[73,171],"neighboring":[74],"states":[75],"Markov":[78],"decision":[79],"process;":[80],"thus":[81],"resulting":[82],"high":[84],"computational":[85,157],"complexity":[86,158,173],"tends":[88],"to":[89,95,200,209],"limit":[90],"their":[91],"real-world":[92],"plausibility":[93],"due":[94],"tight":[97],"time":[98,207],"constraint":[99],"RL.":[101,130,223],"Given":[102],"above,":[104],"this":[105,132],"article":[106],"showcases":[107],"first":[109],"study":[110],"how":[112],"transferability":[113],"across":[114],"frames":[115],"exploited":[118],"boosting":[120],"creation":[122],"minimal":[124],"yet":[125],"powerful":[126],"image-based":[129],"To":[131],"end,":[133],"we":[134],"introduce":[135],"three":[136],"types":[137],"frame-correlation":[139],"transfers":[140],"(FCTs)":[141],"anterior":[143],"case":[144],"transfer,":[145,148],"random":[146],"projection-based":[147],"principal":[150],"components-based":[151],"transfer)":[152],"with":[153],"varying":[154],"degrees":[155],"adversaries":[161],"via":[162],"genetic":[164],"algorithm.":[165],"We":[166],"empirically":[167],"demonstrate":[168],"tradeoff":[170],"potency":[175],"transfer":[178],"mechanism":[179],"by":[180],"exploring":[181],"four":[182],"fully":[183],"trained":[184],"state-of-the-art":[185],"policies":[186],"on":[187,215],"six":[188],"Atari":[189],"games.":[190],"Our":[191],"FCTs":[192],"dramatically":[193],"speed":[194],"up":[195],"generation":[198],"compared":[199],"methods,":[202],"often":[203],"reducing":[204],"computation":[206],"required":[208],"nearly":[210],"zero;":[211],"thus,":[212],"shedding":[213],"light":[214],"real":[217],"threat":[218],"real-time":[220]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":4},{"year":2021,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
