{"id":"https://openalex.org/W3033758172","doi":"https://doi.org/10.1145/3341525.3394987","title":"Selection of Code Segments for Exclusion from Code Similarity Detection","display_name":"Selection of Code Segments for Exclusion from Code Similarity Detection","publication_year":2020,"publication_date":"2020-06-03","ids":{"openalex":"https://openalex.org/W3033758172","doi":"https://doi.org/10.1145/3341525.3394987","mag":"3033758172"},"language":"en","primary_location":{"id":"doi:10.1145/3341525.3394987","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3341525.3394987","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2020 ACM Conference on Innovation and Technology in Computer Science Education","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073990695","display_name":"Norma P. Simon","orcid":null},"institutions":[{"id":"https://openalex.org/I2801185773","display_name":"Hunter Water","ror":"https://ror.org/02n5xmn14","country_code":"AU","type":"other","lineage":["https://openalex.org/I2801185773"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Simon","raw_affiliation_strings":["University of Newcastle, Ourimbah, Australia"],"affiliations":[{"raw_affiliation_string":"University of Newcastle, Ourimbah, Australia","institution_ids":["https://openalex.org/I2801185773"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043851929","display_name":"Oscar Karnalim","orcid":"https://orcid.org/0000-0003-4930-6249"},"institutions":[{"id":"https://openalex.org/I2801185773","display_name":"Hunter Water","ror":"https://ror.org/02n5xmn14","country_code":"AU","type":"other","lineage":["https://openalex.org/I2801185773"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Oscar Karnalim","raw_affiliation_strings":["University of Newcastle, Ourimbah, Australia"],"affiliations":[{"raw_affiliation_string":"University of Newcastle, Ourimbah, Australia","institution_ids":["https://openalex.org/I2801185773"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022993892","display_name":"Judy Sheard","orcid":"https://orcid.org/0000-0002-4179-8149"},"institutions":[{"id":"https://openalex.org/I56590836","display_name":"Monash University","ror":"https://ror.org/02bfwt286","country_code":"AU","type":"education","lineage":["https://openalex.org/I56590836"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Judy Sheard","raw_affiliation_strings":["Monash University, Melbourne, VIC, Australia"],"affiliations":[{"raw_affiliation_string":"Monash University, Melbourne, VIC, Australia","institution_ids":["https://openalex.org/I56590836"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042306223","display_name":"Ilir Dema","orcid":null},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Ilir Dema","raw_affiliation_strings":["University of Toronto, Mississauga, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Toronto, Mississauga, ON, Canada","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032981748","display_name":"Amey Karkare","orcid":"https://orcid.org/0000-0002-3664-6490"},"institutions":[{"id":"https://openalex.org/I94234084","display_name":"Indian Institute of Technology Kanpur","ror":"https://ror.org/05pjsgx75","country_code":"IN","type":"education","lineage":["https://openalex.org/I94234084"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Amey Karkare","raw_affiliation_strings":["Indian Institute of Technology, Kanpur, India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology, Kanpur, India","institution_ids":["https://openalex.org/I94234084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041367899","display_name":"Juho Leinonen","orcid":"https://orcid.org/0000-0001-6829-9449"},"institutions":[{"id":"https://openalex.org/I133731052","display_name":"University of Helsinki","ror":"https://ror.org/040af2s02","country_code":"FI","type":"education","lineage":["https://openalex.org/I133731052"]}],"countries":["FI"],"is_corresponding":false,"raw_author_name":"Juho Leinonen","raw_affiliation_strings":["University of Helsinki, Helsinki, Finland"],"affiliations":[{"raw_affiliation_string":"University of Helsinki, Helsinki, Finland","institution_ids":["https://openalex.org/I133731052"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017029944","display_name":"Michael Liut","orcid":"https://orcid.org/0000-0003-2965-5302"},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Michael Liut","raw_affiliation_strings":["University of Toronto, Mississauga, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Toronto, Mississauga, ON, Canada","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002274479","display_name":"Ren\u00e9e McCauley","orcid":"https://orcid.org/0000-0003-2035-9160"},"institutions":[{"id":"https://openalex.org/I204593131","display_name":"College of Charleston","ror":"https://ror.org/00390t168","country_code":"US","type":"education","lineage":["https://openalex.org/I204593131"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Renee McCauley","raw_affiliation_strings":["College of Charleston, Charleston, SC, USA"],"affiliations":[{"raw_affiliation_string":"College of Charleston, Charleston, SC, USA","institution_ids":["https://openalex.org/I204593131"]}]}],"institutions":[],"countries_distinct_count":5,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5073990695"],"corresponding_institution_ids":["https://openalex.org/I2801185773"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.08219627,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"56","issue":null,"first_page":"500","last_page":"501"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11492","display_name":"Academic integrity and plagiarism","score":0.9858999848365784,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9771000146865845,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7890685200691223},{"id":"https://openalex.org/keywords/code-review","display_name":"Code review","score":0.5898748636245728},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5856279730796814},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.5724480748176575},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.543871283531189},{"id":"https://openalex.org/keywords/boilerplate-text","display_name":"Boilerplate text","score":0.5121290683746338},{"id":"https://openalex.org/keywords/sort","display_name":"sort","score":0.48076722025871277},{"id":"https://openalex.org/keywords/code-smell","display_name":"Code smell","score":0.47590741515159607},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4424659311771393},{"id":"https://openalex.org/keywords/string-metric","display_name":"String metric","score":0.41368094086647034},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.41243401169776917},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3300181031227112},{"id":"https://openalex.org/keywords/static-program-analysis","display_name":"Static program analysis","score":0.32314521074295044},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22930222749710083},{"id":"https://openalex.org/keywords/string-searching-algorithm","display_name":"String searching algorithm","score":0.22678616642951965},{"id":"https://openalex.org/keywords/pattern-matching","display_name":"Pattern matching","score":0.22225803136825562},{"id":"https://openalex.org/keywords/software-quality","display_name":"Software quality","score":0.08883845806121826},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.08432045578956604},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.08000591397285461},{"id":"https://openalex.org/keywords/software-development","display_name":"Software development","score":0.07773041725158691}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7890685200691223},{"id":"https://openalex.org/C150292731","wikidata":"https://www.wikidata.org/wiki/Q1342704","display_name":"Code review","level":5,"score":0.5898748636245728},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5856279730796814},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5724480748176575},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.543871283531189},{"id":"https://openalex.org/C75701414","wikidata":"https://www.wikidata.org/wiki/Q1651672","display_name":"Boilerplate text","level":2,"score":0.5121290683746338},{"id":"https://openalex.org/C88548561","wikidata":"https://www.wikidata.org/wiki/Q347599","display_name":"sort","level":2,"score":0.48076722025871277},{"id":"https://openalex.org/C133237599","wikidata":"https://www.wikidata.org/wiki/Q2295111","display_name":"Code smell","level":5,"score":0.47590741515159607},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4424659311771393},{"id":"https://openalex.org/C22820288","wikidata":"https://www.wikidata.org/wiki/Q9050568","display_name":"String metric","level":4,"score":0.41368094086647034},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.41243401169776917},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3300181031227112},{"id":"https://openalex.org/C137287247","wikidata":"https://www.wikidata.org/wiki/Q1329550","display_name":"Static program analysis","level":4,"score":0.32314521074295044},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22930222749710083},{"id":"https://openalex.org/C7757238","wikidata":"https://www.wikidata.org/wiki/Q374040","display_name":"String searching algorithm","level":3,"score":0.22678616642951965},{"id":"https://openalex.org/C68859911","wikidata":"https://www.wikidata.org/wiki/Q1503724","display_name":"Pattern matching","level":2,"score":0.22225803136825562},{"id":"https://openalex.org/C117447612","wikidata":"https://www.wikidata.org/wiki/Q1412670","display_name":"Software quality","level":4,"score":0.08883845806121826},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.08432045578956604},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.08000591397285461},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.07773041725158691},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3341525.3394987","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3341525.3394987","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2020 ACM Conference on Innovation and Technology in Computer Science Education","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.4099999964237213,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W2024438214","https://openalex.org/W2111295912","https://openalex.org/W2132239106","https://openalex.org/W2146659255","https://openalex.org/W2148484595","https://openalex.org/W2155056246","https://openalex.org/W2346364124","https://openalex.org/W2368366855","https://openalex.org/W4292014584","https://openalex.org/W6681648988"],"related_works":["https://openalex.org/W3175279244","https://openalex.org/W3137757622","https://openalex.org/W2083714857","https://openalex.org/W4382562158","https://openalex.org/W2896744621","https://openalex.org/W4384026574","https://openalex.org/W2150625980","https://openalex.org/W1982871693","https://openalex.org/W4285737963","https://openalex.org/W2338725043"],"abstract_inverted_index":{"When":[0],"student":[1,71],"programs":[2],"are":[3,11,21],"compared":[4],"for":[5,173],"similarity,":[6],"certain":[7],"segments":[8,20],"of":[9,18,48,54,93,123,130,164,167],"code":[10,23,40,63,144,151,168],"always":[12],"sure":[13],"to":[14,44,59,66,137,142,160,171],"be":[15,39,67,76,147],"similar.":[16],"Some":[17],"these":[19,115],"boilerplate":[22],"--":[24,35],"public":[25],"static":[26],"void":[27],"main":[28],"String":[29],"[]":[30],"args":[31],"and":[32,36,73,89,110,180],"the":[33,49],"like":[34],"some":[37],"will":[38,83,99,117],"that":[41,114,184],"was":[42],"provided":[43],"students":[45,174],"as":[46,141],"part":[47],"assessment":[50,94,101,124],"specification.":[51],"The":[52,81,133],"purpose":[53],"this":[55],"working":[56,134],"group":[57,97,135],"is":[58,64,112],"explore":[60],"what":[61,143,165],"other":[62],"expected":[65],"reasonably":[68,146],"common":[69],"in":[70,126,154],"assessments,":[72],"should":[74],"therefore":[75],"excluded":[77,148],"from":[78,103,149],"similarity":[79,152],"checking.":[80],"answers":[82],"clearly":[84],"vary":[85],"with":[86,91],"programming":[87,131],"language,":[88],"perhaps":[90],"level":[92],"item.":[95],"Working":[96],"members":[98],"collect":[100],"submissions":[102,116],"their":[104,107],"own":[105],"or":[106],"colleagues'":[108],"students,":[109],"it":[111],"hoped":[113],"together":[118],"encompass":[119],"a":[120,127,162],"wide":[121,128],"variety":[122,129],"tasks":[125],"languages.":[132],"aims":[136,159],"deliver":[138,161],"clear":[139],"guidelines":[140],"can":[145],"automatic":[150],"detection":[153],"various":[155],"circumstances.":[156],"It":[157],"also":[158],"summary":[163],"sort":[166],"lecturers":[169],"tend":[170],"provide":[172,183],"when":[175],"setting":[176],"an":[177],"assigned":[178],"task,":[179],"why":[181],"they":[182],"code.":[185]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
