{"id":"https://openalex.org/W3089552900","doi":"https://doi.org/10.1109/ijcnn48605.2020.9207647","title":"Zero-Shot Source Code Author Identification: A Lexicon and Layout Independent Approach","display_name":"Zero-Shot Source Code Author Identification: A Lexicon and Layout Independent Approach","publication_year":2020,"publication_date":"2020-07-01","ids":{"openalex":"https://openalex.org/W3089552900","doi":"https://doi.org/10.1109/ijcnn48605.2020.9207647","mag":"3089552900"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn48605.2020.9207647","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9207647","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020803752","display_name":"Pegah Hozhabrierdi","orcid":"https://orcid.org/0000-0003-0524-6811"},"institutions":[{"id":"https://openalex.org/I70983195","display_name":"Syracuse University","ror":"https://ror.org/025r5qe02","country_code":"US","type":"education","lineage":["https://openalex.org/I70983195"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Pegah Hozhabrierdi","raw_affiliation_strings":["Department of EECS, Syracuse University, Syracuse, USA"],"affiliations":[{"raw_affiliation_string":"Department of EECS, Syracuse University, Syracuse, USA","institution_ids":["https://openalex.org/I70983195"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046130189","display_name":"Dunai Fuentes Hitos","orcid":null},"institutions":[{"id":"https://openalex.org/I78880903","display_name":"Universidad de Huelva","ror":"https://ror.org/03a1kt624","country_code":"ES","type":"education","lineage":["https://openalex.org/I78880903"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Dunai Fuentes Hitos","raw_affiliation_strings":["Independent Researcher, Huelva, Spain"],"affiliations":[{"raw_affiliation_string":"Independent Researcher, Huelva, Spain","institution_ids":["https://openalex.org/I78880903"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051923415","display_name":"Chilukuri K. Mohan","orcid":"https://orcid.org/0000-0002-6149-6930"},"institutions":[{"id":"https://openalex.org/I70983195","display_name":"Syracuse University","ror":"https://ror.org/025r5qe02","country_code":"US","type":"education","lineage":["https://openalex.org/I70983195"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chilukuri K. Mohan","raw_affiliation_strings":["Department of EECS, Syracuse University, Syracuse, USA"],"affiliations":[{"raw_affiliation_string":"Department of EECS, Syracuse University, Syracuse, USA","institution_ids":["https://openalex.org/I70983195"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5020803752"],"corresponding_institution_ids":["https://openalex.org/I70983195"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.11623911,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9847000241279602,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8145173192024231},{"id":"https://openalex.org/keywords/bigram","display_name":"Bigram","score":0.740686297416687},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.6541503071784973},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.55697101354599},{"id":"https://openalex.org/keywords/obfuscation","display_name":"Obfuscation","score":0.5330979228019714},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5284531116485596},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.5063375234603882},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48477786779403687},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.4820305109024048},{"id":"https://openalex.org/keywords/abstract-syntax-tree","display_name":"Abstract syntax tree","score":0.4308246970176697},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.42538657784461975},{"id":"https://openalex.org/keywords/code-word","display_name":"Code word","score":0.42226776480674744},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.41739022731781006},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3773457109928131},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3587290048599243},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3357129693031311},{"id":"https://openalex.org/keywords/syntax","display_name":"Syntax","score":0.30225270986557007},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.2453402578830719},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2213842272758484},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.18201029300689697}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8145173192024231},{"id":"https://openalex.org/C108757681","wikidata":"https://www.wikidata.org/wiki/Q2773912","display_name":"Bigram","level":3,"score":0.740686297416687},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.6541503071784973},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.55697101354599},{"id":"https://openalex.org/C40305131","wikidata":"https://www.wikidata.org/wiki/Q2616305","display_name":"Obfuscation","level":2,"score":0.5330979228019714},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5284531116485596},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.5063375234603882},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48477786779403687},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.4820305109024048},{"id":"https://openalex.org/C58646249","wikidata":"https://www.wikidata.org/wiki/Q127380","display_name":"Abstract syntax tree","level":3,"score":0.4308246970176697},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42538657784461975},{"id":"https://openalex.org/C153207627","wikidata":"https://www.wikidata.org/wiki/Q863873","display_name":"Code word","level":3,"score":0.42226776480674744},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.41739022731781006},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3773457109928131},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3587290048599243},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3357129693031311},{"id":"https://openalex.org/C60048249","wikidata":"https://www.wikidata.org/wiki/Q37437","display_name":"Syntax","level":2,"score":0.30225270986557007},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.2453402578830719},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2213842272758484},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.18201029300689697},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C137546455","wikidata":"https://www.wikidata.org/wiki/Q3213474","display_name":"Trigram","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn48605.2020.9207647","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9207647","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","score":0.4099999964237213,"display_name":"Partnerships for the goals"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W1463623766","https://openalex.org/W1522301498","https://openalex.org/W1574086225","https://openalex.org/W1626975910","https://openalex.org/W1836465849","https://openalex.org/W1970186913","https://openalex.org/W2022524210","https://openalex.org/W2072164438","https://openalex.org/W2095705004","https://openalex.org/W2111227071","https://openalex.org/W2138621090","https://openalex.org/W2151505086","https://openalex.org/W2170770919","https://openalex.org/W2518108298","https://openalex.org/W2564822508","https://openalex.org/W2742956140","https://openalex.org/W2746791238","https://openalex.org/W2762536380","https://openalex.org/W2786672974","https://openalex.org/W2793556064","https://openalex.org/W2895886944","https://openalex.org/W2913408006","https://openalex.org/W2949117887","https://openalex.org/W2951005127","https://openalex.org/W2963263347","https://openalex.org/W2963775347","https://openalex.org/W2964121744","https://openalex.org/W2970971581","https://openalex.org/W2991234496","https://openalex.org/W2995923588","https://openalex.org/W3091905774","https://openalex.org/W4295312788","https://openalex.org/W6631190155","https://openalex.org/W6636546641","https://openalex.org/W6638667902","https://openalex.org/W6674330103","https://openalex.org/W6680272447","https://openalex.org/W6726497184","https://openalex.org/W6731243579","https://openalex.org/W6744628271","https://openalex.org/W6748816842","https://openalex.org/W6766978945","https://openalex.org/W6783596713"],"related_works":["https://openalex.org/W4310447811","https://openalex.org/W4389751695","https://openalex.org/W2165004968","https://openalex.org/W2320787857","https://openalex.org/W2249843248","https://openalex.org/W3086207785","https://openalex.org/W3012064729","https://openalex.org/W2969229669","https://openalex.org/W2955426500","https://openalex.org/W2388254906"],"abstract_inverted_index":{"We":[0,57,68],"tackle":[1],"the":[2,24,83,131,148],"challenge":[3],"of":[4,7,9,20,23,46,87,133,138,155],"Zero-Shot":[5],"identification":[6],"authors":[8,21,143],"source":[10],"code,":[11,163],"which":[12],"can":[13],"be":[14],"used":[15,101],"with":[16],"no":[17],"prior":[18],"samples":[19,112,139],"outside":[22],"training":[25],"data.":[26],"In":[27],"our":[28],"approach,":[29],"a":[30,38,43,136],"feedforward":[31],"neural":[32],"network":[33,48],"is":[34,49],"first":[35],"trained":[36],"on":[37,110,116],"multi-class":[39],"classification":[40],"task.":[41],"Then,":[42],"substantial":[44],"part":[45],"this":[47,60,75],"duplicated":[50],"and":[51,96,157,161],"reused":[52],"to":[53,59,73],"compare":[54],"code":[55,88,111],"samples.":[56,89],"refer":[58],"design":[61],"as":[62],"Feedforward":[63],"Duplicated":[64],"Resolver":[65],"(FDR)":[66],"model.":[67],"propose":[69],"new":[70],"input":[71],"features":[72,91],"train":[74],"model,":[76],"called":[77],"Variable-Independent":[78],"Nested":[79],"Bigrams,":[80],"extracted":[81],"from":[82,113,119,140],"Abstract":[84],"Syntax":[85],"Trees":[86],"These":[90],"provide":[92],"robustness":[93],"against":[94],"lexical":[95],"layout":[97],"obfuscation":[98],"attacks":[99],"frequently":[100],"in":[102],"plagiarism":[103],"attempts.":[104],"This":[105],"approach":[106],"performs":[107],"accurately":[108],"even":[109],"unknown":[114,142],"authors,":[115],"data":[117],"obtained":[118],"Google":[120],"Code":[121],"Jam,":[122],"an":[123,153],"international":[124],"coding":[125],"competition":[126],"platform.":[127],"For":[128],"example,":[129],"for":[130,159],"task":[132],"predicting":[134],"whether":[135],"pair":[137],"43":[141],"have":[144],"been":[145],"written":[146],"by":[147],"same":[149],"person,":[150],"we":[151],"obtain":[152],"AUC":[154],"0.96":[156],"0.91":[158],"non-obfuscated":[160],"obfuscated":[162],"respectively.":[164]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
