{"id":"https://openalex.org/W4298841214","doi":"https://doi.org/10.1145/2889160.2889165","title":"SourcererCC and SourcererCC-I","display_name":"SourcererCC and SourcererCC-I","publication_year":2016,"publication_date":"2016-05-14","ids":{"openalex":"https://openalex.org/W4298841214","doi":"https://doi.org/10.1145/2889160.2889165"},"language":"en","primary_location":{"id":"doi:10.1145/2889160.2889165","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2889160.2889165","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2889160.2889165","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 38th International Conference on Software Engineering Companion","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/2889160.2889165","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101846745","display_name":"Vaibhav Saini","orcid":"https://orcid.org/0000-0002-6107-9504"},"institutions":[{"id":"https://openalex.org/I204250578","display_name":"University of California, Irvine","ror":"https://ror.org/04gyf1771","country_code":"US","type":"education","lineage":["https://openalex.org/I204250578"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vaibhav Saini","raw_affiliation_strings":["University of California, Irvine, CA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California, Irvine, CA","institution_ids":["https://openalex.org/I204250578"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015641612","display_name":"Hitesh Sajnani","orcid":"https://orcid.org/0009-0004-9973-6241"},"institutions":[{"id":"https://openalex.org/I204250578","display_name":"University of California, Irvine","ror":"https://ror.org/04gyf1771","country_code":"US","type":"education","lineage":["https://openalex.org/I204250578"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hitesh Sajnani","raw_affiliation_strings":["University of California, Irvine, CA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California, Irvine, CA","institution_ids":["https://openalex.org/I204250578"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100720873","display_name":"Jae-Woo Kim","orcid":"https://orcid.org/0000-0002-2622-4219"},"institutions":[{"id":"https://openalex.org/I204250578","display_name":"University of California, Irvine","ror":"https://ror.org/04gyf1771","country_code":"US","type":"education","lineage":["https://openalex.org/I204250578"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jaewoo Kim","raw_affiliation_strings":["University of California, Irvine, CA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California, Irvine, CA","institution_ids":["https://openalex.org/I204250578"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103284742","display_name":"Cristina Videira Lopes","orcid":"https://orcid.org/0000-0003-0551-3908"},"institutions":[{"id":"https://openalex.org/I204250578","display_name":"University of California, Irvine","ror":"https://ror.org/04gyf1771","country_code":"US","type":"education","lineage":["https://openalex.org/I204250578"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Cristina Lopes","raw_affiliation_strings":["University of California, Irvine, CA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California, Irvine, CA","institution_ids":["https://openalex.org/I204250578"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.8325,"has_fulltext":true,"cited_by_count":20,"citation_normalized_percentile":{"value":0.95667387,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"597","last_page":"600"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.790460467338562},{"id":"https://openalex.org/keywords/clone","display_name":"clone (Java method)","score":0.7206382751464844},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.6845276355743408},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5855411887168884},{"id":"https://openalex.org/keywords/workstation","display_name":"Workstation","score":0.522512674331665},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.49198243021965027},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4634333550930023},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.45971181988716125},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4572259485721588},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.4444173574447632},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.43345117568969727},{"id":"https://openalex.org/keywords/inverted-index","display_name":"Inverted index","score":0.4202282726764679},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.3266260325908661},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2801537811756134},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.1965898871421814},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.1585974097251892},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.10398778319358826}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.790460467338562},{"id":"https://openalex.org/C81089528","wikidata":"https://www.wikidata.org/wiki/Q5134986","display_name":"clone (Java method)","level":3,"score":0.7206382751464844},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.6845276355743408},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5855411887168884},{"id":"https://openalex.org/C67953723","wikidata":"https://www.wikidata.org/wiki/Q192525","display_name":"Workstation","level":2,"score":0.522512674331665},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.49198243021965027},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4634333550930023},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.45971181988716125},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4572259485721588},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.4444173574447632},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.43345117568969727},{"id":"https://openalex.org/C130590232","wikidata":"https://www.wikidata.org/wiki/Q1671754","display_name":"Inverted index","level":3,"score":0.4202282726764679},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3266260325908661},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2801537811756134},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.1965898871421814},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.1585974097251892},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.10398778319358826},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C552990157","wikidata":"https://www.wikidata.org/wiki/Q7430","display_name":"DNA","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2889160.2889165","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2889160.2889165","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2889160.2889165","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 38th International Conference on Software Engineering Companion","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/2889160.2889165","is_oa":true,"landing_page_url":"https://doi.org/10.1145/2889160.2889165","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/2889160.2889165","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 38th International Conference on Software Engineering Companion","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7060254769","display_name":null,"funder_award_id":"1218228","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4298841214.pdf","grobid_xml":"https://content.openalex.org/works/W4298841214.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W1567790484","https://openalex.org/W1972466226","https://openalex.org/W1983316175","https://openalex.org/W2020867825","https://openalex.org/W2065622239","https://openalex.org/W2088211982","https://openalex.org/W2088479623","https://openalex.org/W2101606071","https://openalex.org/W2101832700","https://openalex.org/W2109943392","https://openalex.org/W2115534035","https://openalex.org/W2120326119","https://openalex.org/W2122257083","https://openalex.org/W2124173249","https://openalex.org/W2134852596","https://openalex.org/W2138756793","https://openalex.org/W2144886241","https://openalex.org/W2161276236","https://openalex.org/W2165739648","https://openalex.org/W2165879825","https://openalex.org/W2172244770","https://openalex.org/W3132670815","https://openalex.org/W4301168982","https://openalex.org/W4386707048"],"related_works":["https://openalex.org/W2377327490","https://openalex.org/W2045348955","https://openalex.org/W2352028719","https://openalex.org/W2584886384","https://openalex.org/W2378667902","https://openalex.org/W2124379162","https://openalex.org/W2560253012","https://openalex.org/W2791088446","https://openalex.org/W4388335561","https://openalex.org/W2001919569"],"abstract_inverted_index":{"Given":[0],"the":[1,58],"availability":[2],"of":[3,13,23],"large":[4,11,41],"source-code":[5],"repositories,":[6,42],"there":[7,26],"has":[8],"been":[9],"a":[10,21,28],"number":[12],"applications":[14],"for":[15,44],"large-scale":[16],"clone":[17,32],"detection.":[18],"Unfortunately,":[19],"despite":[20],"decade":[22],"active":[24],"research,":[25],"is":[27],"marked":[29],"lack":[30],"in":[31,57],"detectors":[33],"that":[34],"scale":[35],"to":[36],"big":[37],"software":[38],"systems":[39],"or":[40],"specifically":[43],"detecting":[45],"near-miss":[46],"(Type":[47],"3)":[48],"clones":[49],"where":[50],"significant":[51],"editing":[52],"activities":[53],"may":[54],"take":[55],"place":[56],"cloned":[59],"code.":[60]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2022-10-02T00:00:00"}
