{"id":"https://openalex.org/W7127141310","doi":"https://doi.org/10.48550/arxiv.2601.22949","title":"Autonomous Chain-of-Thought Distillation for Graph-Based Fraud Detection","display_name":"Autonomous Chain-of-Thought Distillation for Graph-Based Fraud Detection","publication_year":2026,"publication_date":"2026-01-30","ids":{"openalex":"https://openalex.org/W7127141310","doi":"https://doi.org/10.48550/arxiv.2601.22949"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2601.22949","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124751088","display_name":"Yuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Yuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124844232","display_name":"Jun Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Jun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124839711","display_name":"Bryan Hooi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hooi, Bryan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121089036","display_name":"Bingsheng He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Bingsheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5124846580","display_name":"Cheng Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Cheng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5124751088"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.5200999975204468,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.5200999975204468,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.14090000092983246,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.07880000025033951,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6492000222206116},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5860000252723694},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5374000072479248},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.4657000005245209},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.453900009393692},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.387800008058548},{"id":"https://openalex.org/keywords/node","display_name":"Node (physics)","score":0.38109999895095825},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.3504999876022339}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7803999781608582},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6492000222206116},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5860000252723694},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5374000072479248},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48649999499320984},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.4657000005245209},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.453900009393692},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4097000062465668},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.387800008058548},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.38109999895095825},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3504999876022339},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33160001039505005},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.2833999991416931},{"id":"https://openalex.org/C86532276","wikidata":"https://www.wikidata.org/wiki/Q1184065","display_name":"Delegation","level":2,"score":0.2750000059604645},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2689000070095062},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2581999897956848},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.25519999861717224},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.25209999084472656},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2515999972820282}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2601.22949","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2601.22949","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.22949","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2601.22949","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"score":0.7875658273696899,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Graph-based":[0],"fraud":[1,46,100],"detection":[2,47,155],"on":[3,126],"text-attributed":[4],"graphs":[5],"(TAGs)":[6],"requires":[7],"jointly":[8],"modeling":[9],"rich":[10],"textual":[11],"semantics":[12],"and":[13,26,33,54,78,96,128,143,157],"relational":[14],"dependencies.":[15],"However,":[16],"existing":[17],"LLM-enhanced":[18],"GNN":[19],"approaches":[20],"are":[21,85],"constrained":[22],"by":[23],"predefined":[24,63],"prompting":[25],"decoupled":[27],"training":[28,150],"pipelines,":[29],"limiting":[30],"reasoning":[31,53,76],"autonomy":[32],"weakening":[34],"semantic-structural":[35,80],"alignment.":[36],"We":[37],"propose":[38],"FraudCoT,":[39],"a":[40,67],"unified":[41],"framework":[42],"that":[43,73,110,132],"advances":[44],"TAG-based":[45],"through":[48],"autonomous,":[49],"graph-aware":[50],"chain-of-thought":[51],"(CoT)":[52],"scalable":[55],"LLM-GNN":[56],"co-training.":[57],"To":[58],"address":[59],"the":[60,117],"limitations":[61],"of":[62,120],"prompts,":[64],"we":[65,103],"introduce":[66],"fraud-aware":[68],"selective":[69],"CoT":[70],"distillation":[71],"mechanism":[72],"generates":[74],"diverse":[75],"paths":[77],"enhances":[79],"understanding.":[81],"These":[82],"distilled":[83],"CoTs":[84],"integrated":[86],"into":[87],"node":[88],"texts,":[89],"providing":[90],"GNNs":[91],"with":[92],"enriched,":[93],"multi-hop":[94],"semantic":[95],"structural":[97],"cues":[98],"for":[99],"detection.":[101],"Furthermore,":[102],"develop":[104],"an":[105],"efficient":[106],"asymmetric":[107],"co-training":[108],"strategy":[109],"enables":[111],"end-to-end":[112],"optimization":[113],"while":[114],"significantly":[115],"reducing":[116],"computational":[118],"cost":[119],"naive":[121],"joint":[122],"training.":[123],"Extensive":[124],"experiments":[125],"public":[127],"industrial":[129],"benchmarks":[130],"demonstrate":[131],"FraudCoT":[133],"achieves":[134],"up":[135,145],"to":[136,146],"8.8%":[137],"AUPRC":[138],"improvement":[139],"over":[140],"state-of-the-art":[141],"methods":[142],"delivers":[144],"1,066x":[147],"speedup":[148],"in":[149],"throughput,":[151],"substantially":[152],"advancing":[153],"both":[154],"performance":[156],"efficiency.":[158]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-03T00:00:00"}
