{"id":"https://openalex.org/W1998549095","doi":"https://doi.org/10.1145/2635868.2635886","title":"How should we measure functional sameness from program source code? an exploratory study on Java methods","display_name":"How should we measure functional sameness from program source code? an exploratory study on Java methods","publication_year":2014,"publication_date":"2014-11-04","ids":{"openalex":"https://openalex.org/W1998549095","doi":"https://doi.org/10.1145/2635868.2635886","mag":"1998549095"},"language":"en","primary_location":{"id":"doi:10.1145/2635868.2635886","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2635868.2635886","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd ACM SIGSOFT International Symposium on Foundations of Software Engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024065727","display_name":"Yoshiki Higo","orcid":"https://orcid.org/0000-0002-8278-8975"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"Osaka University","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yoshiki Higo","raw_affiliation_strings":["Osaka University, Japan","[Osaka University,Japan]"],"affiliations":[{"raw_affiliation_string":"Osaka University, Japan","institution_ids":["https://openalex.org/I98285908"]},{"raw_affiliation_string":"[Osaka University,Japan]","institution_ids":["https://openalex.org/I98285908"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109843671","display_name":"Shinji Kusumoto","orcid":null},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"Osaka University","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shinji Kusumoto","raw_affiliation_strings":["Osaka University, Japan","[Osaka University,Japan]"],"affiliations":[{"raw_affiliation_string":"Osaka University, Japan","institution_ids":["https://openalex.org/I98285908"]},{"raw_affiliation_string":"[Osaka University,Japan]","institution_ids":["https://openalex.org/I98285908"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5024065727"],"corresponding_institution_ids":["https://openalex.org/I98285908"],"apc_list":null,"apc_paid":null,"fwci":6.3113,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.9608568,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"294","last_page":"305"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12423","display_name":"Software Reliability and Analysis Research","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7911053895950317},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.6464026570320129},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6053655743598938},{"id":"https://openalex.org/keywords/false-positive-paradox","display_name":"False positive paradox","score":0.5914483666419983},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5844435095787048},{"id":"https://openalex.org/keywords/java","display_name":"Java","score":0.5392178297042847},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.48040297627449036},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.45535069704055786},{"id":"https://openalex.org/keywords/kpi-driven-code-analysis","display_name":"KPI-driven code analysis","score":0.4388338029384613},{"id":"https://openalex.org/keywords/empirical-research","display_name":"Empirical research","score":0.4353299140930176},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.40031591057777405},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3861524760723114},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.35456180572509766},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3508598208427429},{"id":"https://openalex.org/keywords/static-program-analysis","display_name":"Static program analysis","score":0.28585416078567505},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27809804677963257},{"id":"https://openalex.org/keywords/software-development","display_name":"Software development","score":0.19065147638320923},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10756149888038635},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.10729151964187622},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.09517788887023926},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.08431467413902283}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7911053895950317},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.6464026570320129},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6053655743598938},{"id":"https://openalex.org/C64869954","wikidata":"https://www.wikidata.org/wiki/Q1859747","display_name":"False positive paradox","level":2,"score":0.5914483666419983},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5844435095787048},{"id":"https://openalex.org/C548217200","wikidata":"https://www.wikidata.org/wiki/Q251","display_name":"Java","level":2,"score":0.5392178297042847},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.48040297627449036},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.45535069704055786},{"id":"https://openalex.org/C121957198","wikidata":"https://www.wikidata.org/wiki/Q14365593","display_name":"KPI-driven code analysis","level":5,"score":0.4388338029384613},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.4353299140930176},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.40031591057777405},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3861524760723114},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.35456180572509766},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3508598208427429},{"id":"https://openalex.org/C137287247","wikidata":"https://www.wikidata.org/wiki/Q1329550","display_name":"Static program analysis","level":4,"score":0.28585416078567505},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27809804677963257},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.19065147638320923},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10756149888038635},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.10729151964187622},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.09517788887023926},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.08431467413902283},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2635868.2635886","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2635868.2635886","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd ACM SIGSOFT International Symposium on Foundations of Software Engineering","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W1565377632","https://openalex.org/W1593203335","https://openalex.org/W1598423581","https://openalex.org/W1698439592","https://openalex.org/W1938740620","https://openalex.org/W1969191237","https://openalex.org/W1974583579","https://openalex.org/W1977657402","https://openalex.org/W1983118588","https://openalex.org/W1983316175","https://openalex.org/W1984565341","https://openalex.org/W1986541713","https://openalex.org/W1995986391","https://openalex.org/W2037712120","https://openalex.org/W2041190309","https://openalex.org/W2050396504","https://openalex.org/W2056830820","https://openalex.org/W2065622239","https://openalex.org/W2079136077","https://openalex.org/W2081576997","https://openalex.org/W2084595165","https://openalex.org/W2096491586","https://openalex.org/W2097001189","https://openalex.org/W2099969795","https://openalex.org/W2101832700","https://openalex.org/W2105371533","https://openalex.org/W2111643214","https://openalex.org/W2117508687","https://openalex.org/W2119301379","https://openalex.org/W2120322286","https://openalex.org/W2123551785","https://openalex.org/W2124378517","https://openalex.org/W2125681959","https://openalex.org/W2128888088","https://openalex.org/W2135530488","https://openalex.org/W2136294183","https://openalex.org/W2138756793","https://openalex.org/W2141164043","https://openalex.org/W2151951885","https://openalex.org/W2152908881","https://openalex.org/W2153887189","https://openalex.org/W2154027310","https://openalex.org/W2158864412","https://openalex.org/W2164233915","https://openalex.org/W2165739648","https://openalex.org/W2170196926","https://openalex.org/W2170460608","https://openalex.org/W2172244770","https://openalex.org/W2294554540","https://openalex.org/W2482589566","https://openalex.org/W2787379525","https://openalex.org/W2915705208","https://openalex.org/W6640911648","https://openalex.org/W6683106902"],"related_works":["https://openalex.org/W4308823623","https://openalex.org/W2904997879","https://openalex.org/W2019168903","https://openalex.org/W2390085541","https://openalex.org/W1990888989","https://openalex.org/W2149598945","https://openalex.org/W2316077753","https://openalex.org/W656101134","https://openalex.org/W2332490499","https://openalex.org/W377327559"],"abstract_inverted_index":{"Program":[0],"source":[1,22,41],"code":[2,166,220],"is":[3,221],"one":[4],"of":[5,9,16,40,82,113,138,237],"the":[6,37,70,75,79,94,117,144,176,228,238],"main":[7],"targets":[8],"software":[10],"engineering":[11],"research.":[12],"A":[13],"wide":[14],"variety":[15],"research":[17],"has":[18],"been":[19],"conducted":[20,47],"on":[21],"code,":[23,186],"and":[24,31,68,157],"many":[25,189,236],"studies":[26],"have":[27],"leveraged":[28],"structural,":[29],"vocabulary,":[30],"method":[32,76,89,225,233],"signature":[33],"similarities":[34,58,72,96],"to":[35,51,59,99,106,148,207,216],"measure":[36,60],"functional":[38,61],"sameness":[39],"code.":[42,110,130,152],"In":[43,175],"this":[44],"research,":[45],"we":[46,54,102,178,187,193],"an":[48],"empirical":[49],"study":[50,115],"ascertain":[52],"how":[53,101],"should":[55,103],"use":[56,104,179,235],"three":[57,71,95],"sameness.":[62],"We":[63],"used":[64],"two":[65],"large":[66],"datasets":[67],"measured":[69],"between":[73,93,171],"all":[74],"pairs":[77,226,234],"in":[78,205,227],"datasets,":[80],"each":[81,105],"which":[83],"included":[84],"approximately":[85],"15":[86],"million":[87],"Java":[88],"pairs.":[90],"The":[91,111],"relationships":[92],"were":[97],"analyzed":[98],"determine":[100],"detect":[107,217],"functionally":[108,128,150,164,184,218],"similar":[109,129,151,165,185,219],"results":[112],"our":[114],"revealed":[116],"following.":[118],"(1)":[119],"Method":[120],"names":[121],"are":[122,134,146],"not":[123,222],"always":[124],"useful":[125],"for":[126,182,224],"detecting":[127,183,196],"Only":[131],"if":[132],"there":[133],"a":[135,141,202,208,213],"small":[136],"number":[137],"methods":[139,145,245],"having":[140],"given":[142],"name,":[143],"likely":[147],"include":[149],"(2)":[153],"Existing":[154],"file-level,":[155],"method-level,":[156],"block-level":[158],"clone":[159],"detection":[160],"techniques":[161],"often":[162],"miss":[163],"generated":[167],"by":[168,200],"copy-and-paste":[169],"operations":[170],"different":[172],"projects.":[173],"(3)":[174],"cases":[177],"structural":[180,209],"similarity":[181,204,215],"obtained":[188],"false":[190,198],"positives.":[191],"However,":[192],"can":[194],"avoid":[195],"most":[197],"positives":[199],"using":[201],"vocabulary":[203,214],"addition":[206],"one.":[210],"(4)":[211],"Using":[212],"suitable":[223],"same":[229,239],"file":[230],"because":[231],"such":[232,242],"program":[240],"elements":[241],"as":[243],"private":[244,247],"or":[246],"fields.":[248]},"counts_by_year":[{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
