{"id":"https://openalex.org/W2588341850","doi":"https://doi.org/10.1155/2017/7809047","title":"WASTK: A Weighted Abstract Syntax Tree Kernel Method for Source Code Plagiarism Detection","display_name":"WASTK: A Weighted Abstract Syntax Tree Kernel Method for Source Code Plagiarism Detection","publication_year":2017,"publication_date":"2017-01-01","ids":{"openalex":"https://openalex.org/W2588341850","doi":"https://doi.org/10.1155/2017/7809047","mag":"2588341850"},"language":"en","primary_location":{"id":"doi:10.1155/2017/7809047","is_oa":true,"landing_page_url":"https://doi.org/10.1155/2017/7809047","pdf_url":"http://downloads.hindawi.com/journals/sp/2017/7809047.pdf","source":{"id":"https://openalex.org/S166774750","display_name":"Scientific Programming","issn_l":"1058-9244","issn":["1058-9244","1875-919X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319869","host_organization_name":"Hindawi Publishing Corporation","host_organization_lineage":["https://openalex.org/P4310319869"],"host_organization_lineage_names":["Hindawi Publishing Corporation"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Scientific Programming","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"http://downloads.hindawi.com/journals/sp/2017/7809047.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087956954","display_name":"Deqiang Fu","orcid":"https://orcid.org/0000-0002-2960-3337"},"institutions":[{"id":"https://openalex.org/I31683504","display_name":"Beijing Forestry University","ror":"https://ror.org/04xv2pc41","country_code":"CN","type":"education","lineage":["https://openalex.org/I1327237609","https://openalex.org/I31683504","https://openalex.org/I4210127390"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Deqiang Fu","raw_affiliation_strings":["Jisuan Institute of Technology, Beijing Judao Youda Network Technology Co. Ltd., No. 18 Suzhoujie St., Room 1204, Haidian District, Beijing 100080, China","School of Information Science and Technology, Beijing Forestry University, No. 35 Qinghuadong Road, Haidian District, Beijing 100083, China"],"raw_orcid":"https://orcid.org/0000-0002-2960-3337","affiliations":[{"raw_affiliation_string":"Jisuan Institute of Technology, Beijing Judao Youda Network Technology Co. Ltd., No. 18 Suzhoujie St., Room 1204, Haidian District, Beijing 100080, China","institution_ids":[]},{"raw_affiliation_string":"School of Information Science and Technology, Beijing Forestry University, No. 35 Qinghuadong Road, Haidian District, Beijing 100083, China","institution_ids":["https://openalex.org/I31683504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100704964","display_name":"Yanyan Xu","orcid":"https://orcid.org/0000-0001-7174-6588"},"institutions":[{"id":"https://openalex.org/I31683504","display_name":"Beijing Forestry University","ror":"https://ror.org/04xv2pc41","country_code":"CN","type":"education","lineage":["https://openalex.org/I1327237609","https://openalex.org/I31683504","https://openalex.org/I4210127390"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yanyan Xu","raw_affiliation_strings":["School of Information Science and Technology, Beijing Forestry University, No. 35 Qinghuadong Road, Haidian District, Beijing 100083, China"],"raw_orcid":"https://orcid.org/0000-0001-7174-6588","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Beijing Forestry University, No. 35 Qinghuadong Road, Haidian District, Beijing 100083, China","institution_ids":["https://openalex.org/I31683504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035043415","display_name":"Haoran Yu","orcid":"https://orcid.org/0000-0003-4335-0740"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haoran Yu","raw_affiliation_strings":["Jisuan Institute of Technology, Beijing Judao Youda Network Technology Co. Ltd., No. 18 Suzhoujie St., Room 1204, Haidian District, Beijing 100080, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Jisuan Institute of Technology, Beijing Judao Youda Network Technology Co. Ltd., No. 18 Suzhoujie St., Room 1204, Haidian District, Beijing 100080, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075564663","display_name":"Boyang Yang","orcid":"https://orcid.org/0000-0001-9270-730X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Boyang Yang","raw_affiliation_strings":["Jisuan Institute of Technology, Beijing Judao Youda Network Technology Co. Ltd., No. 18 Suzhoujie St., Room 1204, Haidian District, Beijing 100080, China"],"raw_orcid":"https://orcid.org/0000-0001-9270-730X","affiliations":[{"raw_affiliation_string":"Jisuan Institute of Technology, Beijing Judao Youda Network Technology Co. Ltd., No. 18 Suzhoujie St., Room 1204, Haidian District, Beijing 100080, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100704964"],"corresponding_institution_ids":["https://openalex.org/I31683504"],"apc_list":{"value":1800,"currency":"USD","value_usd":1800},"apc_paid":{"value":1800,"currency":"USD","value_usd":1800},"fwci":11.138,"has_fulltext":true,"cited_by_count":44,"citation_normalized_percentile":{"value":0.98278883,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"2017","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11492","display_name":"Academic integrity and plagiarism","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9700999855995178,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7882489562034607},{"id":"https://openalex.org/keywords/syntax","display_name":"Syntax","score":0.7882256507873535},{"id":"https://openalex.org/keywords/abstract-syntax-tree","display_name":"Abstract syntax tree","score":0.7862608432769775},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.6344816088676453},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.6059388518333435},{"id":"https://openalex.org/keywords/abstract-syntax","display_name":"Abstract syntax","score":0.5793818235397339},{"id":"https://openalex.org/keywords/plagiarism-detection","display_name":"Plagiarism detection","score":0.5615559816360474},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.541661262512207},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5317099690437317},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.5288673043251038},{"id":"https://openalex.org/keywords/node","display_name":"Node (physics)","score":0.45865345001220703},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37437158823013306},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.36947572231292725},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.33231568336486816},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14489921927452087},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.0741809606552124}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7882489562034607},{"id":"https://openalex.org/C60048249","wikidata":"https://www.wikidata.org/wiki/Q37437","display_name":"Syntax","level":2,"score":0.7882256507873535},{"id":"https://openalex.org/C58646249","wikidata":"https://www.wikidata.org/wiki/Q127380","display_name":"Abstract syntax tree","level":3,"score":0.7862608432769775},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.6344816088676453},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.6059388518333435},{"id":"https://openalex.org/C114408938","wikidata":"https://www.wikidata.org/wiki/Q333373","display_name":"Abstract syntax","level":3,"score":0.5793818235397339},{"id":"https://openalex.org/C2780907237","wikidata":"https://www.wikidata.org/wiki/Q2986238","display_name":"Plagiarism detection","level":2,"score":0.5615559816360474},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.541661262512207},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5317099690437317},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.5288673043251038},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.45865345001220703},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37437158823013306},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.36947572231292725},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.33231568336486816},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14489921927452087},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.0741809606552124},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1155/2017/7809047","is_oa":true,"landing_page_url":"https://doi.org/10.1155/2017/7809047","pdf_url":"http://downloads.hindawi.com/journals/sp/2017/7809047.pdf","source":{"id":"https://openalex.org/S166774750","display_name":"Scientific Programming","issn_l":"1058-9244","issn":["1058-9244","1875-919X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319869","host_organization_name":"Hindawi Publishing Corporation","host_organization_lineage":["https://openalex.org/P4310319869"],"host_organization_lineage_names":["Hindawi Publishing Corporation"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Scientific Programming","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:63732d8db27b4d2ab82c106d68f05bb6","is_oa":false,"landing_page_url":"https://doaj.org/article/63732d8db27b4d2ab82c106d68f05bb6","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Scientific Programming, Vol 2017 (2017)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1155/2017/7809047","is_oa":true,"landing_page_url":"https://doi.org/10.1155/2017/7809047","pdf_url":"http://downloads.hindawi.com/journals/sp/2017/7809047.pdf","source":{"id":"https://openalex.org/S166774750","display_name":"Scientific Programming","issn_l":"1058-9244","issn":["1058-9244","1875-919X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319869","host_organization_name":"Hindawi Publishing Corporation","host_organization_lineage":["https://openalex.org/P4310319869"],"host_organization_lineage_names":["Hindawi Publishing Corporation"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Scientific Programming","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8700000047683716,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G254770905","display_name":null,"funder_award_id":"61472369","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G4751482564","display_name":null,"funder_award_id":"61472369","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G598301828","display_name":null,"funder_award_id":"2016JX06","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G7935017937","display_name":null,"funder_award_id":"2016JX06","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2588341850.pdf","grobid_xml":"https://content.openalex.org/works/W2588341850.grobid-xml"},"referenced_works_count":10,"referenced_works":["https://openalex.org/W1971195438","https://openalex.org/W2073265902","https://openalex.org/W2083278176","https://openalex.org/W2085698608","https://openalex.org/W2121412398","https://openalex.org/W2135409670","https://openalex.org/W2144211451","https://openalex.org/W2368366855","https://openalex.org/W4252211664","https://openalex.org/W4252251536"],"related_works":["https://openalex.org/W2077104824","https://openalex.org/W2536864162","https://openalex.org/W2613250302","https://openalex.org/W2390421503","https://openalex.org/W4389751695","https://openalex.org/W2095381028","https://openalex.org/W2387926336","https://openalex.org/W4294658953","https://openalex.org/W319507398","https://openalex.org/W2143166528"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3],"introduce":[4],"a":[5,47,108,120],"source":[6,44],"code":[7,45,75],"plagiarism":[8,25],"detection":[9,26],"method,":[10],"named":[11],"WASTK":[12,28,40,112],"(Weighted":[13],"Abstract":[14],"Syntax":[15],"Tree":[16],"Kernel),":[17],"for":[18],"computer":[19],"science":[20],"education.":[21],"Different":[22],"from":[23],"other":[24,32,126],"methods,":[27],"takes":[29],"some":[30],"aspects":[31],"than":[33,125],"the":[34,43,57,61,92],"similarity":[35,58],"between":[36],"programs":[37],"into":[38],"account.":[39],"firstly":[41],"transfers":[42],"of":[46,64,94],"program":[48],"to":[49,85],"an":[50,82,102],"abstract":[51,66,103],"syntax":[52,67,104],"tree":[53,62,105],"and":[54,131],"then":[55],"gets":[56],"by":[59,73,80,110],"calculating":[60],"kernel":[63],"two":[65],"trees.":[68],"To":[69],"avoid":[70],"misjudgment":[71],"caused":[72],"trivial":[74],"snippets":[76],"or":[77],"frameworks":[78],"given":[79],"instructors,":[81],"idea":[83],"similar":[84],"TF-IDF":[86],"(Term":[87],"Frequency-Inverse":[88],"Document":[89],"Frequency)":[90],"in":[91,101],"field":[93],"information":[95],"retrieval":[96],"is":[97,106,113],"applied.":[98],"Each":[99],"node":[100],"assigned":[107],"weight":[109],"TF-IDF.":[111],"evaluated":[114],"on":[115],"different":[116],"datasets":[117],"and,":[118],"as":[119],"result,":[121],"performs":[122],"much":[123],"better":[124],"popular":[127],"methods":[128],"like":[129],"Sim":[130],"JPlag.":[132]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":1}],"updated_date":"2026-05-21T09:19:25.381259","created_date":"2025-10-10T00:00:00"}
