{"id":"https://openalex.org/W4313185449","doi":"https://doi.org/10.1145/3524610.3527909","title":"Semantic similarity metrics for evaluating source code summarization","display_name":"Semantic similarity metrics for evaluating source code summarization","publication_year":2022,"publication_date":"2022-05-16","ids":{"openalex":"https://openalex.org/W4313185449","doi":"https://doi.org/10.1145/3524610.3527909"},"language":"en","primary_location":{"id":"doi:10.1145/3524610.3527909","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3524610.3527909","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3524610.3527909","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th IEEE/ACM International Conference on Program Comprehension","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3524610.3527909","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019604003","display_name":"Sakib Haque","orcid":null},"institutions":[{"id":"https://openalex.org/I107639228","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43","country_code":"US","type":"education","lineage":["https://openalex.org/I107639228"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sakib Haque","raw_affiliation_strings":["University of Notre Dame"],"affiliations":[{"raw_affiliation_string":"University of Notre Dame","institution_ids":["https://openalex.org/I107639228"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043366284","display_name":"Zachary Eberhart","orcid":"https://orcid.org/0000-0003-0725-5009"},"institutions":[{"id":"https://openalex.org/I107639228","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43","country_code":"US","type":"education","lineage":["https://openalex.org/I107639228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zachary Eberhart","raw_affiliation_strings":["University of Notre Dame"],"affiliations":[{"raw_affiliation_string":"University of Notre Dame","institution_ids":["https://openalex.org/I107639228"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006683167","display_name":"Aakash Bansal","orcid":"https://orcid.org/0000-0001-7475-7899"},"institutions":[{"id":"https://openalex.org/I107639228","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43","country_code":"US","type":"education","lineage":["https://openalex.org/I107639228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aakash Bansal","raw_affiliation_strings":["University of Notre Dame"],"affiliations":[{"raw_affiliation_string":"University of Notre Dame","institution_ids":["https://openalex.org/I107639228"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084874990","display_name":"Collin McMillan","orcid":"https://orcid.org/0009-0005-0887-1083"},"institutions":[{"id":"https://openalex.org/I107639228","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43","country_code":"US","type":"education","lineage":["https://openalex.org/I107639228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Collin McMillan","raw_affiliation_strings":["University of Notre Dame"],"affiliations":[{"raw_affiliation_string":"University of Notre Dame","institution_ids":["https://openalex.org/I107639228"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5019604003"],"corresponding_institution_ids":["https://openalex.org/I107639228"],"apc_list":null,"apc_paid":null,"fwci":28.1929,"has_fulltext":false,"cited_by_count":94,"citation_normalized_percentile":{"value":0.9970424,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"36","last_page":"47"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8616759777069092},{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.8254847526550293},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.663321852684021},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6461859345436096},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.6382907032966614},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.6228182911872864},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6021106839179993},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5575105547904968},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5543830394744873},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5415305495262146},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.531620442867279},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5283570885658264},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5142359137535095},{"id":"https://openalex.org/keywords/documentation","display_name":"Documentation","score":0.5088079571723938},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4319208860397339},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.42147812247276306},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.20938122272491455}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8616759777069092},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.8254847526550293},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.663321852684021},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6461859345436096},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.6382907032966614},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.6228182911872864},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6021106839179993},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5575105547904968},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5543830394744873},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5415305495262146},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.531620442867279},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5283570885658264},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5142359137535095},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.5088079571723938},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4319208860397339},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.42147812247276306},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.20938122272491455},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3524610.3527909","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3524610.3527909","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3524610.3527909","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th IEEE/ACM International Conference on Program Comprehension","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3524610.3527909","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3524610.3527909","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3524610.3527909","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th IEEE/ACM International Conference on Program Comprehension","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.800000011920929,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4313185449.pdf","grobid_xml":"https://content.openalex.org/works/W4313185449.grobid-xml"},"referenced_works_count":61,"referenced_works":["https://openalex.org/W1614298861","https://openalex.org/W1976658129","https://openalex.org/W1978394996","https://openalex.org/W2007022086","https://openalex.org/W2013378101","https://openalex.org/W2014224954","https://openalex.org/W2018816078","https://openalex.org/W2028742638","https://openalex.org/W2053107307","https://openalex.org/W2082160726","https://openalex.org/W2101105183","https://openalex.org/W2106568252","https://openalex.org/W2109600226","https://openalex.org/W2117228548","https://openalex.org/W2123301721","https://openalex.org/W2123402141","https://openalex.org/W2131744502","https://openalex.org/W2133333349","https://openalex.org/W2142225512","https://openalex.org/W2157331557","https://openalex.org/W2165549065","https://openalex.org/W2166410494","https://openalex.org/W2166879716","https://openalex.org/W2294980783","https://openalex.org/W2612953412","https://openalex.org/W2753186769","https://openalex.org/W2806532810","https://openalex.org/W2887364112","https://openalex.org/W2896457183","https://openalex.org/W2914501196","https://openalex.org/W2928893288","https://openalex.org/W2949335953","https://openalex.org/W2949611393","https://openalex.org/W2963858034","https://openalex.org/W2963918774","https://openalex.org/W2965373594","https://openalex.org/W2970641574","https://openalex.org/W2979792666","https://openalex.org/W2992347006","https://openalex.org/W3014921686","https://openalex.org/W3016234956","https://openalex.org/W3034689979","https://openalex.org/W3085939759","https://openalex.org/W3086449553","https://openalex.org/W3103748122","https://openalex.org/W3107611171","https://openalex.org/W3119434107","https://openalex.org/W3195727321","https://openalex.org/W4243989635","https://openalex.org/W4244356278","https://openalex.org/W6649581940","https://openalex.org/W6681371269","https://openalex.org/W6682631176","https://openalex.org/W6684464451","https://openalex.org/W6691431627","https://openalex.org/W6739901393","https://openalex.org/W6741814560","https://openalex.org/W6749879876","https://openalex.org/W6753851271","https://openalex.org/W6761205521","https://openalex.org/W6806684424"],"related_works":["https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W2091301346","https://openalex.org/W3148229873","https://openalex.org/W4389760904","https://openalex.org/W2150160875","https://openalex.org/W4242223894","https://openalex.org/W4306886878","https://openalex.org/W2973759123","https://openalex.org/W1517524280"],"abstract_inverted_index":{"Source":[0],"code":[1,9,26,76,81,109,229],"summarization":[2,27],"involves":[3],"creating":[4],"brief":[5],"descriptions":[6,14],"of":[7,19,32,50,73,75,79,95,103,206,227],"source":[8,228],"in":[10,158,218],"natural":[11],"language.":[12],"These":[13],"are":[15,82,98],"a":[16,29,101,121,127,132,140,159],"key":[17],"component":[18],"software":[20,33],"documentation":[21,54],"such":[22,142],"as":[23,143],"JavaDocs.":[24],"Automatic":[25],"is":[28,59,108,118,129,134,153,172],"prized":[30],"target":[31],"engineering":[34],"research,":[35],"due":[36],"to":[37,43,84,120,131,192,196,203],"the":[38,46,92,96,113,116,162,179,194],"high":[39,48],"value":[40],"summaries":[41,78],"have":[42,161,168],"programmers":[44],"and":[45,52,77,115,165,208,222],"simultaneously":[47],"cost":[49],"writing":[51],"maintaining":[53],"by":[55,112,125,182],"hand.":[56],"Current":[57],"work":[58,217],"almost":[60],"all":[61,156],"based":[62,214],"on":[63,215],"machine":[64],"models":[65],"trained":[66],"via":[67,139],"big":[68],"data":[69],"input.":[70],"Large":[71],"datasets":[72],"examples":[74],"that":[80,154,173],"used":[83],"train":[85],"an":[86,190],"e.g.":[87],"encoder-decoder":[88],"neural":[89],"model.":[90],"Then":[91],"output":[93],"predictions":[94],"model":[97],"evaluated":[99],"against":[100],"set":[102],"reference":[104,133,209],"summaries.":[105,210],"The":[106,123,147,170],"input":[107],"not":[110,155,177],"seen":[111],"model,":[114],"prediction":[117,128],"compared":[119,130],"reference.":[122],"means":[124],"which":[126,197],"essentially":[135],"word":[136,151,199],"overlap,":[137],"calculated":[138,174],"metric":[141],"BLEU":[144],"or":[145],"ROUGE.":[146],"problem":[148],"with":[149],"using":[150],"overlap":[152,200],"words":[157,167],"sentence":[160],"same":[163],"importance,":[164],"many":[166],"synonyms.":[169],"result":[171],"similarity":[175,181,205,220],"may":[176],"match":[178],"perceived":[180],"human":[183],"readers.":[184],"In":[185],"this":[186],"paper,":[187],"we":[188],"conduct":[189],"experiment":[191],"measure":[193],"degree":[195],"various":[198],"metrics":[201,221],"correlate":[202],"human-rated":[204],"predicted":[207],"We":[211],"evaluate":[212],"alternatives":[213],"current":[216],"semantic":[219],"propose":[223],"recommendations":[224],"for":[225],"evaluation":[226],"summarization.":[230]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":35},{"year":2024,"cited_by_count":37},{"year":2023,"cited_by_count":20},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
