{"id":"https://openalex.org/W3207841299","doi":"https://doi.org/10.1109/tcyb.2021.3116762","title":"Graph-Attention-Based Casual Discovery With Trust Region-Navigated Clipping Policy Optimization","display_name":"Graph-Attention-Based Casual Discovery With Trust Region-Navigated Clipping Policy Optimization","publication_year":2021,"publication_date":"2021-10-20","ids":{"openalex":"https://openalex.org/W3207841299","doi":"https://doi.org/10.1109/tcyb.2021.3116762","mag":"3207841299","pmid":"https://pubmed.ncbi.nlm.nih.gov/34665751"},"language":"en","primary_location":{"id":"doi:10.1109/tcyb.2021.3116762","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2021.3116762","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2412.19578","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101707300","display_name":"Shixuan Liu","orcid":"https://orcid.org/0000-0003-4780-3890"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shixuan Liu","raw_affiliation_strings":["College of Systems Engineering, National University of Defense Technology, Changsha, China"],"raw_orcid":"https://orcid.org/0000-0003-4780-3890","affiliations":[{"raw_affiliation_string":"College of Systems Engineering, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081897060","display_name":"Yanghe Feng","orcid":"https://orcid.org/0000-0003-1608-8695"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanghe Feng","raw_affiliation_strings":["College of Systems Engineering, National University of Defense Technology, Changsha, China"],"raw_orcid":"https://orcid.org/0000-0003-1608-8695","affiliations":[{"raw_affiliation_string":"College of Systems Engineering, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038637903","display_name":"Keyu Wu","orcid":"https://orcid.org/0000-0001-8493-0712"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Keyu Wu","raw_affiliation_strings":["College of Systems Engineering, National University of Defense Technology, Changsha, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Systems Engineering, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101851407","display_name":"Guangquan Cheng","orcid":"https://orcid.org/0000-0002-3166-477X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guangquan Cheng","raw_affiliation_strings":["College of Systems Engineering, National University of Defense Technology, Changsha, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Systems Engineering, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101842754","display_name":"Jincai Huang","orcid":"https://orcid.org/0000-0003-4515-1518"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jincai Huang","raw_affiliation_strings":["College of Systems Engineering, National University of Defense Technology, Changsha, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Systems Engineering, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5115588589","display_name":"Zhong Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhong Liu","raw_affiliation_strings":["College of Systems Engineering, National University of Defense Technology, Changsha, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Systems Engineering, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.2594,"has_fulltext":true,"cited_by_count":10,"citation_normalized_percentile":{"value":0.84085194,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"53","issue":"4","first_page":"2311","last_page":"2324"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9879999756813049,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.9861000180244446,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6893454194068909},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5749765634536743},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5415663123130798},{"id":"https://openalex.org/keywords/latent-variable","display_name":"Latent variable","score":0.5126542448997498},{"id":"https://openalex.org/keywords/optimization-problem","display_name":"Optimization problem","score":0.45875027775764465},{"id":"https://openalex.org/keywords/grasp","display_name":"GRASP","score":0.43842968344688416},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4298498034477234},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.42223358154296875},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4195294976234436},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41053104400634766},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.40636634826660156},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3249322474002838},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.24796339869499207},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2424379587173462},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15735560655593872}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6893454194068909},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5749765634536743},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5415663123130798},{"id":"https://openalex.org/C51167844","wikidata":"https://www.wikidata.org/wiki/Q4422623","display_name":"Latent variable","level":2,"score":0.5126542448997498},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.45875027775764465},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.43842968344688416},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4298498034477234},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.42223358154296875},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4195294976234436},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41053104400634766},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.40636634826660156},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3249322474002838},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.24796339869499207},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2424379587173462},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15735560655593872},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tcyb.2021.3116762","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2021.3116762","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},{"id":"pmid:34665751","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/34665751","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on cybernetics","raw_type":null},{"id":"pmh:oai:arXiv.org:2412.19578","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2412.19578","pdf_url":"https://arxiv.org/pdf/2412.19578","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2412.19578","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2412.19578","pdf_url":"https://arxiv.org/pdf/2412.19578","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2118812850","display_name":null,"funder_award_id":"71701205","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G547299875","display_name":null,"funder_award_id":"2020JJ5675","funder_id":"https://openalex.org/F4320322843","funder_display_name":"Natural Science Foundation of\u00a0Hunan Province"},{"id":"https://openalex.org/G6306360950","display_name":null,"funder_award_id":"62001495","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322843","display_name":"Natural Science Foundation of\u00a0Hunan Province","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3207841299.pdf","grobid_xml":"https://content.openalex.org/works/W3207841299.grobid-xml"},"referenced_works_count":53,"referenced_works":["https://openalex.org/W563711960","https://openalex.org/W1501856433","https://openalex.org/W1530964327","https://openalex.org/W1851422093","https://openalex.org/W1977446441","https://openalex.org/W1987124340","https://openalex.org/W1993411524","https://openalex.org/W2036363967","https://openalex.org/W2073307618","https://openalex.org/W2116341502","https://openalex.org/W2119717200","https://openalex.org/W2146545355","https://openalex.org/W2151226328","https://openalex.org/W2163166770","https://openalex.org/W2165190832","https://openalex.org/W2168175751","https://openalex.org/W2201581102","https://openalex.org/W2344953603","https://openalex.org/W2492794003","https://openalex.org/W2553303224","https://openalex.org/W2557632452","https://openalex.org/W2580909119","https://openalex.org/W2736601468","https://openalex.org/W2755310417","https://openalex.org/W2789929276","https://openalex.org/W2808914202","https://openalex.org/W2899806036","https://openalex.org/W2905181441","https://openalex.org/W2908261578","https://openalex.org/W2909711564","https://openalex.org/W2949383815","https://openalex.org/W2963929190","https://openalex.org/W2964199361","https://openalex.org/W2976993238","https://openalex.org/W2987232971","https://openalex.org/W2990022244","https://openalex.org/W2996051514","https://openalex.org/W3098710260","https://openalex.org/W3106525726","https://openalex.org/W4220671231","https://openalex.org/W4294558607","https://openalex.org/W4297733535","https://openalex.org/W4298091299","https://openalex.org/W4302423442","https://openalex.org/W6638018090","https://openalex.org/W6679709731","https://openalex.org/W6682361391","https://openalex.org/W6683204974","https://openalex.org/W6754506371","https://openalex.org/W6760181788","https://openalex.org/W6761805307","https://openalex.org/W6763561447","https://openalex.org/W6768741345"],"related_works":["https://openalex.org/W2163296013","https://openalex.org/W2743859443","https://openalex.org/W2326995835","https://openalex.org/W165915117","https://openalex.org/W2059402478","https://openalex.org/W2123347777","https://openalex.org/W4387804363","https://openalex.org/W2019547100","https://openalex.org/W2477150073","https://openalex.org/W2515493494"],"abstract_inverted_index":{"In":[0],"many":[1],"domains":[2],"of":[3,60,66,73,164,204],"empirical":[4],"sciences,":[5],"discovering":[6],"the":[7,47,57,61,64,70,77,156,161,188,192],"causal":[8,37,131],"structure":[9],"within":[10],"variables":[11],"remains":[12],"an":[13],"indispensable":[14],"task.":[15],"Recently,":[16],"to":[17,44,56,83,159],"tackle":[18],"unoriented":[19],"edges":[20],"or":[21],"latent":[22],"assumptions":[23],"violation":[24],"suffered":[25],"by":[26],"conventional":[27],"methods,":[28],"researchers":[29],"formulated":[30],"a":[31,41,110,123,168],"reinforcement":[32],"learning":[33],"(RL)":[34],"procedure":[35,62],"for":[36,46,113,130],"discovery":[38,132],"and":[39,69,86,139,149,199,207],"equipped":[40],"REINFORCE":[42,80,153],"algorithm":[43],"search":[45,137],"best":[48],"rewarded":[49],"directed":[50],"acyclic":[51],"graph.":[52],"The":[53],"two":[54],"keys":[55],"overall":[58],"performance":[59,88],"are":[63],"robustness":[65],"RL":[67,194],"methods":[68],"efficient":[71,162],"encoding":[72,163],"variables.":[74],"However,":[75],"on":[76],"one":[78],"hand,":[79,158],"is":[81,109],"prone":[82],"local":[84],"convergence":[85],"unstable":[87],"during":[89],"training.":[90],"Neither":[91],"trust":[92,124],"region":[93],"policy":[94,101,127,142],"optimization,":[95,143],"being":[96],"computationally":[97],"expensive,":[98],"nor":[99],"proximal":[100],"optimization":[102,115,128,208],"(PPO),":[103],"suffering":[104],"from":[105],"aggregate":[106],"constraint":[107],"deviation,":[108],"decent":[111],"alternative":[112],"combinatory":[114],"problems":[116],"with":[117,146],"considerable":[118],"individual":[119],"subactions.":[120],"We":[121],"propose":[122,167],"region-navigated":[125],"clipping":[126],"method":[129,190,195],"that":[133,175],"guarantees":[134],"both":[135,197],"better":[136],"efficiency":[138],"steadiness":[140],"in":[141,144,196,202],"comparison":[145],"REINFORCE,":[147],"PPO,":[148],"our":[150],"prioritized":[151],"sampling-guided":[152],"implementation.":[154],"On":[155],"other":[157],"boost":[160],"variables,":[165],"we":[166],"refined":[169],"graph":[170],"attention":[171],"encoder":[172],"called":[173],"SDGAT":[174],"can":[176],"grasp":[177],"more":[178],"feature":[179],"information":[180],"without":[181],"priori":[182],"neighborhood":[183],"information.":[184],"With":[185],"these":[186],"improvements,":[187],"proposed":[189],"outperforms":[191],"former":[193],"synthetic":[198],"benchmark":[200],"datasets":[201],"terms":[203],"output":[205],"results":[206],"robustness.":[209]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
