{"id":"https://openalex.org/W7111136384","doi":"https://doi.org/10.48550/arxiv.2512.06638","title":"The Impact of Data Characteristics on GNN Evaluation for Detecting Fake News","display_name":"The Impact of Data Characteristics on GNN Evaluation for Detecting Fake News","publication_year":2025,"publication_date":"2025-12-07","ids":{"openalex":"https://openalex.org/W7111136384","doi":"https://doi.org/10.48550/arxiv.2512.06638"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.06638","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.06638","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.06638","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Karn, Isha","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Karn, Isha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Jensen, David","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jensen, David","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.8593999743461609,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.8593999743461609,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.0868000015616417,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.006800000090152025,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6060000061988831},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5375999808311462},{"id":"https://openalex.org/keywords/shuffling","display_name":"Shuffling","score":0.47749999165534973},{"id":"https://openalex.org/keywords/node","display_name":"Node (physics)","score":0.41449999809265137},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.41370001435279846},{"id":"https://openalex.org/keywords/network-topology","display_name":"Network topology","score":0.40799999237060547},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.39879998564720154},{"id":"https://openalex.org/keywords/social-graph","display_name":"Social graph","score":0.3862999975681305},{"id":"https://openalex.org/keywords/test-data","display_name":"Test data","score":0.3785000145435333}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7541000247001648},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6060000061988831},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5375999808311462},{"id":"https://openalex.org/C167927819","wikidata":"https://www.wikidata.org/wiki/Q1930567","display_name":"Shuffling","level":2,"score":0.47749999165534973},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4634999930858612},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4629000127315521},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4593999981880188},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.41449999809265137},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.41370001435279846},{"id":"https://openalex.org/C199845137","wikidata":"https://www.wikidata.org/wiki/Q145490","display_name":"Network topology","level":2,"score":0.40799999237060547},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.39879998564720154},{"id":"https://openalex.org/C2777522414","wikidata":"https://www.wikidata.org/wiki/Q648457","display_name":"Social graph","level":3,"score":0.3862999975681305},{"id":"https://openalex.org/C16910744","wikidata":"https://www.wikidata.org/wiki/Q7705759","display_name":"Test data","level":2,"score":0.3785000145435333},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3718999922275543},{"id":"https://openalex.org/C60908668","wikidata":"https://www.wikidata.org/wiki/Q690207","display_name":"Perceptron","level":3,"score":0.3700000047683716},{"id":"https://openalex.org/C2993807640","wikidata":"https://www.wikidata.org/wiki/Q103709453","display_name":"Attention network","level":2,"score":0.35409998893737793},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3499000072479248},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.3463999927043915},{"id":"https://openalex.org/C179717631","wikidata":"https://www.wikidata.org/wiki/Q2991667","display_name":"Multilayer perceptron","level":3,"score":0.3452000021934509},{"id":"https://openalex.org/C2988224531","wikidata":"https://www.wikidata.org/wiki/Q20830730","display_name":"Network structure","level":2,"score":0.32260000705718994},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.32100000977516174},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.31949999928474426},{"id":"https://openalex.org/C2781170535","wikidata":"https://www.wikidata.org/wiki/Q30587856","display_name":"Noisy data","level":2,"score":0.28040000796318054},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2718000113964081},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.26910001039505005},{"id":"https://openalex.org/C106937863","wikidata":"https://www.wikidata.org/wiki/Q7236518","display_name":"Power graph analysis","level":3,"score":0.2612999975681305},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2581000030040741},{"id":"https://openalex.org/C71901391","wikidata":"https://www.wikidata.org/wiki/Q7126699","display_name":"Upload","level":2,"score":0.25769999623298645}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.06638","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.06638","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.06638","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.06638","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Graph":[0],"neural":[1],"networks":[2],"(GNNs)":[3],"are":[4,43,132,172,191],"widely":[5,207],"used":[6,34,208],"for":[7],"the":[8,15,31,48,90,102,118,177,214,223],"detection":[9],"of":[10,20,30,50,104,120,170,216,225],"fake":[11],"news":[12,21],"by":[13],"modeling":[14,74,217],"content":[16],"and":[17,40,112,193,220],"propagation":[18,54],"structure":[19,121,155,194],"articles":[22],"on":[23,185],"social":[24],"media.":[25],"We":[26,76,94,138],"show":[27,95],"that":[28,52,65,88,96,140,154,167,206],"two":[29],"most":[32],"commonly":[33],"benchmark":[35,78],"data":[36,58],"sets":[37,59],"-":[38,42],"GossipCop":[39],"PolitiFact":[41],"poorly":[44],"suited":[45],"to":[46,71],"evaluating":[47],"utility":[49,215],"models":[51],"use":[53],"structure.":[55],"Specifically,":[56],"these":[57,123,161],"exhibit":[60],"shallow,":[61],"ego-like":[62],"graph":[63,231],"topologies":[64],"provide":[66,203],"little":[67],"or":[68,99,134],"no":[69],"ability":[70],"differentiate":[72],"among":[73],"methods.":[75],"systematically":[77],"five":[79],"GNN":[80],"architectures":[81],"against":[82],"a":[83,157],"structure-agnostic":[84],"multilayer":[85],"perceptron":[86],"(MLP)":[87],"uses":[89],"same":[91],"node":[92,130,189],"features.":[93],"MLPs":[97],"match":[98],"closely":[100],"trail":[101],"performance":[103,107,141],"GNNs,":[105],"with":[106,227],"gaps":[108],"often":[109],"within":[110],"1-2%":[111],"overlapping":[113],"confidence":[114],"intervals.":[115],"To":[116],"isolate":[117],"contribution":[119],"in":[122,160],"datasets,":[124],"we":[125],"conduct":[126],"controlled":[127],"experiments":[128],"where":[129,188],"features":[131,190],"shuffled":[133],"edge":[135,150],"structures":[136],"randomized.":[137],"find":[139],"collapses":[142],"under":[143,149],"feature":[144],"shuffling":[145],"but":[146],"remains":[147],"stable":[148],"randomization.":[151],"This":[152],"suggests":[153],"plays":[156],"negligible":[158],"role":[159],"benchmarks.":[162],"Structural":[163],"analysis":[164],"further":[165],"reveals":[166],"over":[168],"75%":[169],"nodes":[171],"only":[173],"one":[174],"hop":[175],"from":[176],"root,":[178],"exhibiting":[179],"minimal":[180],"structural":[181,218],"diversity.":[182],"In":[183],"contrast,":[184],"synthetic":[186],"datasets":[187,226],"noisy":[192],"is":[195],"informative,":[196],"GNNs":[197],"significantly":[198],"outperform":[199],"MLPs.":[200],"These":[201],"findings":[202],"strong":[204],"evidence":[205],"benchmarks":[209],"do":[210],"not":[211],"meaningfully":[212],"test":[213],"features,":[219],"they":[221],"motivate":[222],"development":[224],"richer,":[228],"more":[229],"diverse":[230],"topologies.":[232]},"counts_by_year":[],"updated_date":"2025-12-10T02:49:46.989445","created_date":"2025-12-10T00:00:00"}
