{"id":"https://openalex.org/W7135176806","doi":"https://doi.org/10.1145/3800961","title":"MetaRAG: Identifying Website Owner Using Meta-Path-Guided Dynamic Graph Retrieval-Augmented Generation","display_name":"MetaRAG: Identifying Website Owner Using Meta-Path-Guided Dynamic Graph Retrieval-Augmented Generation","publication_year":2026,"publication_date":"2026-03-13","ids":{"openalex":"https://openalex.org/W7135176806","doi":"https://doi.org/10.1145/3800961"},"language":"en","primary_location":{"id":"doi:10.1145/3800961","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3800961","pdf_url":null,"source":{"id":"https://openalex.org/S4394735545","display_name":"ACM Transactions on Information Systems","issn_l":"1046-8188","issn":["1046-8188","1558-2868"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Information Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061270214","display_name":"Cheng Tu","orcid":"https://orcid.org/0000-0002-4223-7298"},"institutions":[{"id":"https://openalex.org/I4210149848","display_name":"National Synchrotron Radiation Laboratory","ror":"https://ror.org/03rx2tr07","country_code":"CN","type":"facility","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366","https://openalex.org/I4210149848"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng Tu","raw_affiliation_strings":["National University of Defense Technology, Hefei, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0002-4223-7298","affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Hefei, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China","institution_ids":["https://openalex.org/I4210149848"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089377262","display_name":"Yunshan Ma","orcid":"https://orcid.org/0000-0003-3038-5389"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yunshan Ma","raw_affiliation_strings":["School of Computing and Information Systems, Singapore Management University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0003-3038-5389","affiliations":[{"raw_affiliation_string":"School of Computing and Information Systems, Singapore Management University, Singapore, Singapore","institution_ids":["https://openalex.org/I79891267"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035286001","display_name":"Bingyang Guo","orcid":"https://orcid.org/0000-0002-1166-2830"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bingyang Guo","raw_affiliation_strings":["National University of Defense Technology, Anhui, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0002-1166-2830","affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Anhui, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Qianyu Li","orcid":"https://orcid.org/0000-0002-7137-999X"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qianyu Li","raw_affiliation_strings":["National University of Defense Technology, Anhui, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0002-7137-999X","affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Anhui, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yang Li","orcid":"https://orcid.org/0009-0005-9585-3472"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Li","raw_affiliation_strings":["National University of Defense Technology, Anhui, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China"],"raw_orcid":"https://orcid.org/0009-0005-9585-3472","affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Anhui, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Min Zhang","orcid":"https://orcid.org/0000-0002-6654-7610"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Min Zhang","raw_affiliation_strings":["National University of Defense Technology, Anhui, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0002-6654-7610","affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Anhui, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128992672","display_name":"Fan Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210149848","display_name":"National Synchrotron Radiation Laboratory","ror":"https://ror.org/03rx2tr07","country_code":"CN","type":"facility","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366","https://openalex.org/I4210149848"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fan Shi","raw_affiliation_strings":["National University of Defense Technology, Hefei, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0003-4533-2706","affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Hefei, China and Anhui Province Key Laboratory of Cyberspace Security Situation Awareness and Evaluation, Hefei, China","institution_ids":["https://openalex.org/I4210149848"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5128993320","display_name":"Xiang Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiang Wang","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0002-6148-6329","affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.30082753,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"44","issue":"4","first_page":"1","last_page":"33"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.2815999984741211,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.2815999984741211,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.13779999315738678,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.09009999781847,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6611999869346619},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6384000182151794},{"id":"https://openalex.org/keywords/credibility","display_name":"Credibility","score":0.6225000023841858},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.5479999780654907},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5004000067710876},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.49939998984336853},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.4758000075817108}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8962000012397766},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6611999869346619},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6384000182151794},{"id":"https://openalex.org/C2780224610","wikidata":"https://www.wikidata.org/wiki/Q1530061","display_name":"Credibility","level":2,"score":0.6225000023841858},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6202999949455261},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.5479999780654907},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5004000067710876},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.49939998984336853},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.4758000075817108},{"id":"https://openalex.org/C2987255567","wikidata":"https://www.wikidata.org/wiki/Q33002955","display_name":"Knowledge graph","level":2,"score":0.4607999920845032},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.42989999055862427},{"id":"https://openalex.org/C1173588","wikidata":"https://www.wikidata.org/wiki/Q6554294","display_name":"Link analysis","level":2,"score":0.3506999909877777},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3443000018596649},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.29829999804496765},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.2980000078678131},{"id":"https://openalex.org/C197046077","wikidata":"https://www.wikidata.org/wiki/Q785337","display_name":"Web mining","level":3,"score":0.2741999924182892},{"id":"https://openalex.org/C118643609","wikidata":"https://www.wikidata.org/wiki/Q189210","display_name":"Web application","level":2,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3800961","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3800961","pdf_url":null,"source":{"id":"https://openalex.org/S4394735545","display_name":"ACM Transactions on Information Systems","issn_l":"1046-8188","issn":["1046-8188","1558-2868"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Information Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.6293723583221436}],"awards":[{"id":"https://openalex.org/G6948229166","display_name":null,"funder_award_id":"2023ZD0121102","funder_id":"https://openalex.org/F4320329860","funder_display_name":"National Science and Technology Major Project"}],"funders":[{"id":"https://openalex.org/F4320329860","display_name":"National Science and Technology Major Project","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W2012833704","https://openalex.org/W2145349611","https://openalex.org/W2613843087","https://openalex.org/W2782696945","https://openalex.org/W3012871709","https://openalex.org/W3168547639","https://openalex.org/W4284713043","https://openalex.org/W4322762565","https://openalex.org/W4362588215","https://openalex.org/W4386291602","https://openalex.org/W4389279191","https://openalex.org/W4389520779","https://openalex.org/W4390692489","https://openalex.org/W4391407054","https://openalex.org/W4400222836","https://openalex.org/W4401671778","https://openalex.org/W4416379250"],"related_works":[],"abstract_inverted_index":{"Website":[0],"owner":[1,38,230],"identification":[2,39],"aims":[3],"to":[4,7,57,153,160,184,202],"link":[5],"websites":[6],"their":[8],"real-world":[9,198],"owners,":[10],"which":[11],"is":[12],"crucial":[13],"for":[14,25,36,226],"credibility":[15],"assessment":[16],"and":[17,23,31,63,83,136,156,171,180,187],"information":[18,21,163],"provenance":[19],"in":[20,27,116,216],"retrieval":[22,152],"vital":[24],"applications":[26],"cybersecurity,":[28],"Internet":[29],"governance,":[30],"digital":[32],"regulation.":[33],"Existing":[34],"approaches":[35],"website":[37,229],"primarily":[40],"rely":[41],"on":[42,168,195],"querying":[43],"infrastructure":[44,75,134],"registration":[45,61],"records":[46,62],"or":[47,59,164],"analyzing":[48],"webpage":[49,65,138],"content.":[50,66],"However,":[51],"these":[52],"methods":[53],"often":[54],"fail":[55],"due":[56],"incomplete":[58],"outdated":[60],"sparse":[64],"We":[67,192],"observe":[68],"that":[69,106,132,150,178],"inter-website":[70],"relationships,":[71],"derived":[72],"from":[73],"shared":[74],"data":[76,135],"such":[77],"as":[78],"primary":[79],"domains,":[80],"IP":[81],"blocks,":[82],"geolocations,":[84],"can":[85],"provide":[86],"valuable":[87],"but":[88],"underutilized":[89],"ownership":[90,190],"cues.":[91],"To":[92],"exploit":[93],"this":[94],"insight,":[95],"we":[96],"propose":[97],"MetaRAG,":[98],"a":[99,117,127,141,145,173],"meta-path-guided":[100,146],"dynamic":[101,147],"graph":[102,129],"retrieval-augmented":[103],"generation":[104],"framework":[105],"performs":[107],"reasoning":[108,148,225],"using":[109],"large":[110,222],"language":[111,223],"models":[112],"over":[113,205],"ownership-relevant":[114,154],"paths":[115,183],"website-centric":[118],"knowledge":[119,128,220],"graph.":[120],"MetaRAG":[121,194],"consists":[122],"of":[123,213],"three":[124],"components:":[125],"(1)":[126],"construction":[130],"module":[131,149,177],"integrates":[133],"crawled":[137],"content":[139],"into":[140],"unified":[142],"representation;":[143],"(2)":[144],"constrains":[151],"meta-paths":[155],"adaptively":[157],"decides":[158],"whether":[159],"retrieve":[161],"more":[162,227],"perform":[165],"inference":[166],"based":[167],"evidence":[169,175],"completeness;":[170],"(3)":[172],"multi-path":[174],"refinement":[176],"aggregates":[179],"scores":[181],"retrieved":[182],"suppress":[185],"noise":[186],"distill":[188],"high-confidence":[189],"signals.":[191],"evaluate":[193],"two":[196],"constructed":[197],"datasets,":[199],"achieving":[200],"up":[201],"6.82%":[203],"improvement":[204],"strong":[206],"baselines.":[207],"The":[208],"results":[209],"demonstrate":[210],"the":[211],"effectiveness":[212],"our":[214],"approach":[215],"combining":[217],"structured":[218],"web":[219],"with":[221],"model-based":[224],"accurate":[228],"identification.":[231]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-14T00:00:00"}
