{"id":"https://openalex.org/W3096860048","doi":"https://doi.org/10.1109/access.2020.3034932","title":"Language and Obfuscation Oblivious Source Code Authorship Attribution","display_name":"Language and Obfuscation Oblivious Source Code Authorship Attribution","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3096860048","doi":"https://doi.org/10.1109/access.2020.3034932","mag":"3096860048"},"language":"en","primary_location":{"id":"doi:10.1109/access.2020.3034932","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3034932","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09245552.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09245552.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103137516","display_name":"Sarim Zafar","orcid":"https://orcid.org/0000-0002-8693-3244"},"institutions":[{"id":"https://openalex.org/I57328836","display_name":"North Dakota State University","ror":"https://ror.org/05h1bnb22","country_code":"US","type":"education","lineage":["https://openalex.org/I57328836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sarim Zafar","raw_affiliation_strings":["North Dakota State University, Fargo, ND, USA","[Department of Computer Science, North Dakota State University, Fargo, ND, USA]"],"raw_orcid":"https://orcid.org/0000-0002-8693-3244","affiliations":[{"raw_affiliation_string":"North Dakota State University, Fargo, ND, USA","institution_ids":["https://openalex.org/I57328836"]},{"raw_affiliation_string":"[Department of Computer Science, North Dakota State University, Fargo, ND, USA]","institution_ids":["https://openalex.org/I57328836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050971039","display_name":"Muhammad Usman Sarwar","orcid":"https://orcid.org/0000-0001-8195-0953"},"institutions":[{"id":"https://openalex.org/I57328836","display_name":"North Dakota State University","ror":"https://ror.org/05h1bnb22","country_code":"US","type":"education","lineage":["https://openalex.org/I57328836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Muhammad Usman Sarwar","raw_affiliation_strings":["North Dakota State University, Fargo, ND, USA","[Department of Computer Science, North Dakota State University, Fargo, ND, USA]"],"raw_orcid":"https://orcid.org/0000-0001-8195-0953","affiliations":[{"raw_affiliation_string":"North Dakota State University, Fargo, ND, USA","institution_ids":["https://openalex.org/I57328836"]},{"raw_affiliation_string":"[Department of Computer Science, North Dakota State University, Fargo, ND, USA]","institution_ids":["https://openalex.org/I57328836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091100480","display_name":"Saeed Salem","orcid":"https://orcid.org/0000-0001-6478-4674"},"institutions":[{"id":"https://openalex.org/I57328836","display_name":"North Dakota State University","ror":"https://ror.org/05h1bnb22","country_code":"US","type":"education","lineage":["https://openalex.org/I57328836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Saeed Salem","raw_affiliation_strings":["North Dakota State University, Fargo, ND, USA","[Department of Computer Science, North Dakota State University, Fargo, ND, USA]"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"North Dakota State University, Fargo, ND, USA","institution_ids":["https://openalex.org/I57328836"]},{"raw_affiliation_string":"[Department of Computer Science, North Dakota State University, Fargo, ND, USA]","institution_ids":["https://openalex.org/I57328836"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054186434","display_name":"Muhammad Zubair Malik","orcid":"https://orcid.org/0000-0001-5574-2288"},"institutions":[{"id":"https://openalex.org/I57328836","display_name":"North Dakota State University","ror":"https://ror.org/05h1bnb22","country_code":"US","type":"education","lineage":["https://openalex.org/I57328836"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Muhammad Zubair Malik","raw_affiliation_strings":["North Dakota State University, Fargo, ND, USA","[Department of Computer Science, North Dakota State University, Fargo, ND, USA]"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"North Dakota State University, Fargo, ND, USA","institution_ids":["https://openalex.org/I57328836"]},{"raw_affiliation_string":"[Department of Computer Science, North Dakota State University, Fargo, ND, USA]","institution_ids":["https://openalex.org/I57328836"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I57328836"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.9481,"has_fulltext":true,"cited_by_count":17,"citation_normalized_percentile":{"value":0.8151097,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"8","issue":null,"first_page":"197581","last_page":"197596"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8597701787948608},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.7493079900741577},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5149543881416321},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5096209049224854},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5016965866088867},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.47607865929603577},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3696601390838623},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.36681342124938965},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35998332500457764},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3475756049156189},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.283380925655365},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.14161470532417297}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8597701787948608},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.7493079900741577},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5149543881416321},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5096209049224854},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5016965866088867},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.47607865929603577},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3696601390838623},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.36681342124938965},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35998332500457764},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3475756049156189},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.283380925655365},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.14161470532417297},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2020.3034932","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3034932","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09245552.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:656ee93ae29f4682b570aaadfca0fbc6","is_oa":true,"landing_page_url":"https://doaj.org/article/656ee93ae29f4682b570aaadfca0fbc6","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 8, Pp 197581-197596 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2020.3034932","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.3034932","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09245552.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5600000023841858,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320318080","display_name":"North Dakota Established Program to Stimulate Competitive Research","ror":null},{"id":"https://openalex.org/F4320338283","display_name":"Office of Experimental Program to Stimulate Competitive Research","ror":"https://ror.org/04k9mqs78"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3096860048.pdf","grobid_xml":"https://content.openalex.org/works/W3096860048.grobid-xml"},"referenced_works_count":57,"referenced_works":["https://openalex.org/W90413272","https://openalex.org/W1463623766","https://openalex.org/W1529790664","https://openalex.org/W1533861849","https://openalex.org/W1665214252","https://openalex.org/W1677182931","https://openalex.org/W1903025644","https://openalex.org/W1936750108","https://openalex.org/W1985086575","https://openalex.org/W2007337962","https://openalex.org/W2010452235","https://openalex.org/W2044555705","https://openalex.org/W2054126054","https://openalex.org/W2078111377","https://openalex.org/W2096733369","https://openalex.org/W2106487114","https://openalex.org/W2108406823","https://openalex.org/W2110127053","https://openalex.org/W2138233214","https://openalex.org/W2138621090","https://openalex.org/W2139047213","https://openalex.org/W2144270983","https://openalex.org/W2158899491","https://openalex.org/W2165533158","https://openalex.org/W2205815960","https://openalex.org/W2523437799","https://openalex.org/W2594167370","https://openalex.org/W2606377603","https://openalex.org/W2724213014","https://openalex.org/W2742948365","https://openalex.org/W2765254708","https://openalex.org/W2891865791","https://openalex.org/W2906453189","https://openalex.org/W2951005127","https://openalex.org/W2952230511","https://openalex.org/W2963026686","https://openalex.org/W2964153283","https://openalex.org/W2968917279","https://openalex.org/W2970803838","https://openalex.org/W2976414818","https://openalex.org/W2991080871","https://openalex.org/W2994689640","https://openalex.org/W2995923588","https://openalex.org/W3099206234","https://openalex.org/W3100927979","https://openalex.org/W3215498156","https://openalex.org/W4236036072","https://openalex.org/W6603649106","https://openalex.org/W6631592667","https://openalex.org/W6631943919","https://openalex.org/W6637242042","https://openalex.org/W6676179522","https://openalex.org/W6683738474","https://openalex.org/W6687750345","https://openalex.org/W6727380541","https://openalex.org/W6766196973","https://openalex.org/W6767164110"],"related_works":["https://openalex.org/W2389214306","https://openalex.org/W4293226380","https://openalex.org/W2965083567","https://openalex.org/W4235240664","https://openalex.org/W1838576100","https://openalex.org/W2757182831","https://openalex.org/W2095886385","https://openalex.org/W2089704382","https://openalex.org/W2100349471","https://openalex.org/W3081644756"],"abstract_inverted_index":{"Source":[0,28],"Code":[1,29,218],"Authorship":[2,30],"Attribution":[3,31],"can":[4,99,112],"answer":[5],"many":[6],"interesting":[7],"questions":[8],"such":[9,119,233],"as:":[10],"Who":[11],"wrote":[12],"the":[13,18,80,84,90,94,104,151,155,164,169,189,200,270],"malicious":[14],"source":[15,19,42,57,85,109,165,178,196],"code?":[16],"Is":[17],"code":[20,43,86,197],"plagiarized,":[21],"and":[22,48,87,115,248],"does":[23,238],"it":[24,237],"infringe":[25],"on":[26,89,216],"copyright?":[27],"is":[32,46,245,266],"done":[33],"by":[34,168,181],"observing":[35],"distinctive":[36],"patterns":[37,52],"of":[38,79,96,108,260,272],"style":[39,97],"in":[40,188,232],"a":[41,69,133,143,160,234,277],"whose":[44],"author":[45,171],"unknown":[47],"comparing":[49],"them":[50],"with":[51],"learned":[53],"from":[54],"known":[55],"authors'":[56],"codes.":[58],"In":[59,176],"this":[60],"paper,":[61],"we":[62],"present":[63],"an":[64,258],"efficient":[65,249],"approach":[66,102,141,215,244],"to":[67,131,153,159,173,208,256],"learn":[68,132],"novel":[70],"representation":[71,135],"using":[72,125],"deep":[73],"metric":[74],"learning.":[75],"The":[76],"existing":[77,251],"state":[78],"art":[81],"approaches":[82],"tokenize":[83],"work":[88],"keyword":[91],"level,":[92],"limiting":[93],"elements":[95],"they":[98],"consider.":[100],"Our":[101,140,243],"uses":[103,142,206],"raw":[105],"character":[106,157],"stream":[107,158],"code.":[110],"It":[111],"examine":[113],"keywords":[114],"different":[116,182,224],"stylistic":[117],"features":[118],"as":[120],"variable":[121],"naming":[122],"conventions":[123],"or":[124],"tabs":[126],"vs.":[127],"spaces,":[128],"enabling":[129],"us":[130],"richer":[134],"than":[136,250,268],"other":[137],"keyword-based":[138],"approaches.":[139],"character-level":[144],"Convolutional":[145],"Neural":[146],"Network":[147],"(CNN).":[148],"We":[149,192,212,227,253],"train":[150],"CNN":[152],"map":[154],"input":[156],"dense":[161],"vector,":[162],"mapping":[163],"codes":[166,179],"authored":[167],"same":[170],"close":[172],"each":[174],"other.":[175],"contrast,":[177],"written":[180],"programmers":[183],"are":[184],"mapped":[185],"farther":[186],"apart":[187],"embedding":[190],"space.":[191],"then":[193],"feed":[194],"these":[195],"vectors":[198],"into":[199],"K-nearest":[201],"neighbor":[202],"(KNN)":[203],"classifier":[204],"that":[205,236],"Manhattan-distance":[207],"perform":[209],"authorship":[210],"attribution.":[211],"validated":[213],"our":[214,229],"Google":[217],"Jam":[219],"(GCJ)":[220],"dataset":[221,231],"across":[222,262],"three":[223],"programming":[225],"languages.":[226],"prepare":[228],"large-scale":[230],"way":[235],"not":[239],"induce":[240],"type-I":[241],"error.":[242],"more":[246,267,279],"scalable":[247],"methods.":[252],"were":[254],"able":[255],"achieve":[257],"accuracy":[259],"84.94%":[261],"20,458":[263],"authors,":[264],"which":[265],"twice":[269],"scale":[271],"any":[273],"previous":[274],"study":[275],"under":[276],"much":[278],"challenging":[280],"setting.":[281]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":3}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
