{"id":"https://openalex.org/W4394746213","doi":"https://doi.org/10.1145/3597503.3639215","title":"DSFM: Enhancing Functional Code Clone Detection with Deep Subtree Interactions","display_name":"DSFM: Enhancing Functional Code Clone Detection with Deep Subtree Interactions","publication_year":2024,"publication_date":"2024-04-12","ids":{"openalex":"https://openalex.org/W4394746213","doi":"https://doi.org/10.1145/3597503.3639215"},"language":"en","primary_location":{"id":"doi:10.1145/3597503.3639215","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3597503.3639215","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3597503.3639215","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the IEEE/ACM 46th International Conference on Software Engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3597503.3639215","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101756705","display_name":"Zhiwei Xu","orcid":"https://orcid.org/0000-0003-4430-3727"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiwei Xu","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095377110","display_name":"Shaohua Qiang","orcid":"https://orcid.org/0009-0008-7945-7543"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shaohua Qiang","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015685769","display_name":"D. Song","orcid":"https://orcid.org/0009-0002-2700-2359"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dinghong Song","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071579968","display_name":"Min Zhou","orcid":"https://orcid.org/0000-0002-4679-0488"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Min Zhou","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073617379","display_name":"Hai Wan","orcid":"https://orcid.org/0000-0002-9608-5808"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hai Wan","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100773043","display_name":"Xibin Zhao","orcid":"https://orcid.org/0000-0002-6168-7016"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xibin Zhao","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057157090","display_name":"Ping Luo","orcid":"https://orcid.org/0000-0001-6171-3811"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ping Luo","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100412598","display_name":"Hongyu Zhang","orcid":"https://orcid.org/0000-0002-3063-9425"},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongyu Zhang","raw_affiliation_strings":["Chongqing University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5101756705"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":5.2683,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.95482016,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"12"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12423","display_name":"Software Reliability and Analysis Research","score":0.9710000157356262,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/snippet","display_name":"Snippet","score":0.8573318123817444},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8205610513687134},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6326368451118469},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6234493851661682},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.6067200899124146},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.5870523452758789},{"id":"https://openalex.org/keywords/syntax","display_name":"Syntax","score":0.4766831398010254},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.43593528866767883},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.41752636432647705},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3431134521961212},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33476102352142334}],"concepts":[{"id":"https://openalex.org/C2777822670","wikidata":"https://www.wikidata.org/wiki/Q1120538","display_name":"Snippet","level":2,"score":0.8573318123817444},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8205610513687134},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6326368451118469},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6234493851661682},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.6067200899124146},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.5870523452758789},{"id":"https://openalex.org/C60048249","wikidata":"https://www.wikidata.org/wiki/Q37437","display_name":"Syntax","level":2,"score":0.4766831398010254},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.43593528866767883},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41752636432647705},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3431134521961212},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33476102352142334},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3597503.3639215","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3597503.3639215","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3597503.3639215","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the IEEE/ACM 46th International Conference on Software Engineering","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3597503.3639215","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3597503.3639215","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3597503.3639215","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the IEEE/ACM 46th International Conference on Software Engineering","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1100049447","display_name":null,"funder_award_id":"6212780016","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1151522064","display_name":null,"funder_award_id":"U19A2","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2021969373","display_name":null,"funder_award_id":"92267203","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4020255992","display_name":null,"funder_award_id":"Project","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4543866928","display_name":null,"funder_award_id":"2022YFB3103903","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G4796153733","display_name":null,"funder_award_id":"6202100","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5075807795","display_name":null,"funder_award_id":"U19A2062","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5517038434","display_name":null,"funder_award_id":"2020YFB","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G5618013222","display_name":null,"funder_award_id":"U1911401","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6058138561","display_name":null,"funder_award_id":", No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6127069372","display_name":null,"funder_award_id":"U20A600","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7091651887","display_name":null,"funder_award_id":"62021002","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G760460541","display_name":null,"funder_award_id":"62076146","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8356187857","display_name":null,"funder_award_id":"U20A6003","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8862684424","display_name":null,"funder_award_id":"2020YFB1707700","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323970","display_name":"Ministry of Industry and Information Technology of the People's Republic of China","ror":"https://ror.org/0385nmy68"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4394746213.pdf","grobid_xml":"https://content.openalex.org/works/W4394746213.grobid-xml"},"referenced_works_count":55,"referenced_works":["https://openalex.org/W1771830246","https://openalex.org/W1902237438","https://openalex.org/W2064675550","https://openalex.org/W2065053490","https://openalex.org/W2079887492","https://openalex.org/W2101832700","https://openalex.org/W2104301886","https://openalex.org/W2128782367","https://openalex.org/W2128888088","https://openalex.org/W2138756793","https://openalex.org/W2157331557","https://openalex.org/W2157532207","https://openalex.org/W2282866165","https://openalex.org/W2295739661","https://openalex.org/W2298313545","https://openalex.org/W2344444819","https://openalex.org/W2511803001","https://openalex.org/W2634106992","https://openalex.org/W2726916722","https://openalex.org/W2728599219","https://openalex.org/W2741705590","https://openalex.org/W2788728386","https://openalex.org/W2789876780","https://openalex.org/W2794744252","https://openalex.org/W2807866521","https://openalex.org/W2887364112","https://openalex.org/W2891488835","https://openalex.org/W2899171197","https://openalex.org/W2904067867","https://openalex.org/W2937836435","https://openalex.org/W2954552517","https://openalex.org/W2955426500","https://openalex.org/W2963323306","https://openalex.org/W2963355447","https://openalex.org/W2964150020","https://openalex.org/W2993743533","https://openalex.org/W3014339000","https://openalex.org/W3043078865","https://openalex.org/W3045279034","https://openalex.org/W3045334720","https://openalex.org/W3104991709","https://openalex.org/W3105535951","https://openalex.org/W3124675547","https://openalex.org/W3125205154","https://openalex.org/W3125675786","https://openalex.org/W3126095862","https://openalex.org/W3162904859","https://openalex.org/W3162962341","https://openalex.org/W3196992070","https://openalex.org/W3212083716","https://openalex.org/W4285280217","https://openalex.org/W4287591147","https://openalex.org/W4301168982","https://openalex.org/W4312354494","https://openalex.org/W4389158355"],"related_works":["https://openalex.org/W1607713096","https://openalex.org/W3036724449","https://openalex.org/W2798329462","https://openalex.org/W1511521437","https://openalex.org/W3201315194","https://openalex.org/W4318980730","https://openalex.org/W4289376745","https://openalex.org/W4384811727","https://openalex.org/W3081644756","https://openalex.org/W4231058664"],"abstract_inverted_index":{"Functional":[0],"code":[1,23,29,54,65,87,100,113,131,136,162,192],"clone":[2,24,88,144,193],"detection":[3,194],"is":[4],"important":[5],"for":[6,133],"software":[7],"maintenance.":[8],"In":[9,115],"recent":[10],"years,":[11],"deep":[12,46,75,122,143,147,188,212],"learning":[13],"techniques":[14],"are":[15,42],"introduced":[16],"to":[17,53,58,93,111],"improve":[18,140],"the":[19,83,95,98,141,184,200],"performance":[20],"of":[21,63,85,97,103,160,187],"functional":[22,40,135],"detectors.":[25],"By":[26,170],"representing":[27],"each":[28],"snippet":[30,66],"as":[31],"a":[32,64,68,120],"vector":[33],"containing":[34],"its":[35],"program":[36],"semantics,":[37],"syntactically":[38],"dissimilar":[39],"clones":[41],"detected.":[43],"However,":[44],"existing":[45],"learning-based":[47,76,123,213],"approaches":[48,77],"attach":[49],"too":[50],"much":[51],"importance":[52],"feature":[55],"learning,":[56],"hoping":[57],"project":[59],"all":[60],"recognizable":[61],"knowledge":[62],"into":[67],"single":[69],"vector.":[70],"We":[71],"argue":[72],"that":[73,150],"these":[74],"can":[78],"be":[79],"enhanced":[80],"by":[81],"considering":[82],"characteristics":[84],"syntactic":[86],"detection,":[89],"where":[90],"we":[91,118,139,182],"need":[92],"compare":[94,151],"contents":[96],"source":[99],"(e.g.,":[101],"intersection":[102],"tokens,":[104],"similar":[105,109],"flow":[106],"graphs,":[107],"and":[108,180,209],"subtrees)":[110],"obtain":[112],"clones.":[114,137],"this":[116],"paper,":[117],"propose":[119],"novel":[121],"approach":[124],"named":[125],"DSFM,":[126],"which":[127],"incorporates":[128],"comparisons":[129],"between":[130],"snippets":[132],"detecting":[134],"Specifically,":[138],"typical":[142],"detectors":[145],"with":[146],"subtree":[148,189],"interactions":[149,190],"every":[152],"two":[153,161,204,207],"subtrees":[154],"extracted":[155],"abstract":[156],"syntax":[157],"trees":[158],"(ASTs)":[159],"snippets,":[163],"thereby":[164],"introducing":[165],"more":[166],"fine-grained":[167],"semantic":[168],"similarity.":[169],"conducting":[171],"extensive":[172],"experiments":[173],"on":[174],"three":[175],"widely-used":[176],"datasets,":[177],"GCJ,":[178],"OJClone,":[179],"BigCloneBench,":[181],"demonstrate":[183],"great":[185],"potential":[186],"in":[191],"task.":[195],"The":[196],"proposed":[197],"DSFM":[198],"outperforms":[199],"state-of-the-art":[201],"approaches,":[202,206],"including":[203],"traditional":[205],"unsupervised":[208],"four":[210],"supervised":[211],"baselines.":[214]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-18T07:56:08.524223","created_date":"2025-10-10T00:00:00"}
