{"id":"https://openalex.org/W2981321698","doi":"https://doi.org/10.1145/3361242.3362699","title":"Extracting Code-relevant Description Sentences Based on Structural Similarity","display_name":"Extracting Code-relevant Description Sentences Based on Structural Similarity","publication_year":2019,"publication_date":"2019-10-24","ids":{"openalex":"https://openalex.org/W2981321698","doi":"https://doi.org/10.1145/3361242.3362699","mag":"2981321698"},"language":"en","primary_location":{"id":"doi:10.1145/3361242.3362699","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3361242.3362699","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 11th Asia-Pacific Symposium on Internetware","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087940448","display_name":"Yingkui Cao","orcid":null},"institutions":[{"id":"https://openalex.org/I4210092262","display_name":"Ministry of Education","ror":"https://ror.org/00dh5gw98","country_code":"RO","type":"funder","lineage":["https://openalex.org/I2799732796","https://openalex.org/I4210092262"]}],"countries":["RO"],"is_corresponding":true,"raw_author_name":"Yingkui Cao","raw_affiliation_strings":["Key Laboratory of High Confidence Software Technologies, Ministry of Education"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies, Ministry of Education","institution_ids":["https://openalex.org/I4210092262"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103872660","display_name":"Yanzhen Zou","orcid":null},"institutions":[{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanzhen Zou","raw_affiliation_strings":["Key Laboratory of High Confidence Software Technologies, Ministry of Education, School of Electronics Engineering and Computer Science, Peking University, Beijing, China and Beida(Binhai) Information Research, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies, Ministry of Education, School of Electronics Engineering and Computer Science, Peking University, Beijing, China and Beida(Binhai) Information Research, Tianjin, China","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102928967","display_name":"Bing Xie","orcid":"https://orcid.org/0000-0002-2988-2575"},"institutions":[{"id":"https://openalex.org/I4210092262","display_name":"Ministry of Education","ror":"https://ror.org/00dh5gw98","country_code":"RO","type":"funder","lineage":["https://openalex.org/I2799732796","https://openalex.org/I4210092262"]}],"countries":["RO"],"is_corresponding":false,"raw_author_name":"Bing Xie","raw_affiliation_strings":["Key Laboratory of High Confidence Software Technologies, Ministry of Education"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies, Ministry of Education","institution_ids":["https://openalex.org/I4210092262"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5087940448"],"corresponding_institution_ids":["https://openalex.org/I4210092262"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.18427545,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8626177310943604},{"id":"https://openalex.org/keywords/snippet","display_name":"Snippet","score":0.6830207109451294},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.576943576335907},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5766679048538208},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5708622336387634},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5685936212539673},{"id":"https://openalex.org/keywords/program-comprehension","display_name":"Program comprehension","score":0.5490593314170837},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.5333698987960815},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.5016236305236816},{"id":"https://openalex.org/keywords/code-review","display_name":"Code review","score":0.48849236965179443},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.4806341230869293},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46026307344436646},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.44029533863067627},{"id":"https://openalex.org/keywords/documentation","display_name":"Documentation","score":0.41666197776794434},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.34233295917510986},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.3130539655685425},{"id":"https://openalex.org/keywords/static-program-analysis","display_name":"Static program analysis","score":0.20633485913276672},{"id":"https://openalex.org/keywords/software-development","display_name":"Software development","score":0.12906530499458313},{"id":"https://openalex.org/keywords/software-system","display_name":"Software system","score":0.11734899878501892},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.09626847505569458}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8626177310943604},{"id":"https://openalex.org/C2777822670","wikidata":"https://www.wikidata.org/wiki/Q1120538","display_name":"Snippet","level":2,"score":0.6830207109451294},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.576943576335907},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5766679048538208},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5708622336387634},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5685936212539673},{"id":"https://openalex.org/C2777561058","wikidata":"https://www.wikidata.org/wiki/Q2652119","display_name":"Program comprehension","level":4,"score":0.5490593314170837},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.5333698987960815},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.5016236305236816},{"id":"https://openalex.org/C150292731","wikidata":"https://www.wikidata.org/wiki/Q1342704","display_name":"Code review","level":5,"score":0.48849236965179443},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.4806341230869293},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46026307344436646},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.44029533863067627},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.41666197776794434},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.34233295917510986},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3130539655685425},{"id":"https://openalex.org/C137287247","wikidata":"https://www.wikidata.org/wiki/Q1329550","display_name":"Static program analysis","level":4,"score":0.20633485913276672},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.12906530499458313},{"id":"https://openalex.org/C149091818","wikidata":"https://www.wikidata.org/wiki/Q2429814","display_name":"Software system","level":3,"score":0.11734899878501892},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.09626847505569458},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3361242.3362699","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3361242.3362699","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 11th Asia-Pacific Symposium on Internetware","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7300000190734863,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1566018662","https://openalex.org/W1596967103","https://openalex.org/W2023925487","https://openalex.org/W2034209539","https://openalex.org/W2061235289","https://openalex.org/W2081580037","https://openalex.org/W2112609142","https://openalex.org/W2153579005","https://openalex.org/W2250539671","https://openalex.org/W2366532918","https://openalex.org/W2593635859","https://openalex.org/W2601061983","https://openalex.org/W2745750801","https://openalex.org/W2759683881","https://openalex.org/W2774162863","https://openalex.org/W2788306232","https://openalex.org/W2794601162","https://openalex.org/W2795013376","https://openalex.org/W2802474178","https://openalex.org/W2908809453","https://openalex.org/W2914703977","https://openalex.org/W2964315653","https://openalex.org/W2983396602","https://openalex.org/W3087927280","https://openalex.org/W3098281910"],"related_works":["https://openalex.org/W2122804569","https://openalex.org/W4239900777","https://openalex.org/W4206927195","https://openalex.org/W4384811727","https://openalex.org/W2240979497","https://openalex.org/W3193746984","https://openalex.org/W2025599150","https://openalex.org/W2904997879","https://openalex.org/W2344367508","https://openalex.org/W3135060008"],"abstract_inverted_index":{"Software":[0],"developers":[1],"often":[2,28],"need":[3],"to":[4,17,20,37,68,102,163],"read":[5],"code":[6,25,42,49,56,81,124],"snippets":[7,26,125],"that":[8,112,155],"are":[9,27,35],"dispersed":[10],"among":[11],"different":[12],"documentation,":[13],"e.g.,":[14],"Q&A":[15],"posts,":[16],"reuse":[18],"APIs":[19],"complete":[21],"certain":[22],"tasks.":[23],"These":[24],"surrounded":[29],"by":[30],"lengthy":[31],"context":[32,74],"text":[33],"which":[34],"used":[36],"describe":[38],"the":[39,78,109,152],"functions":[40],"of":[41],"snippets.":[43],"It":[44],"will":[45],"be":[46],"helpful":[47],"for":[48],"comprehension":[50],"if":[51],"we":[52,64,87],"can":[53],"align":[54],"a":[55],"snippet":[57],"with":[58,90,139],"its":[59,73],"description.":[60],"In":[61,106,149],"this":[62],"paper,":[63],"propose":[65],"an":[66],"approach":[67,114,130,157],"extracting":[69],"code-relevant":[70,165],"sentences":[71],"from":[72],"text.":[75],"To":[76],"quantify":[77],"relevance":[79],"between":[80],"line":[82],"and":[83,93,118,126,142],"natural":[84],"language":[85],"sentence,":[86],"represent":[88],"them":[89],"structure":[91],"trees":[92],"calculate":[94],"their":[95],"structural":[96],"similarity.":[97],"We":[98],"conduct":[99],"two":[100],"experiments":[101],"evaluate":[103],"our":[104,113,156],"approach.":[105],"Experiment":[107,150],"I,":[108],"results":[110,153],"show":[111,154],"achieves":[115,131,158],"83.5%":[116],"precision":[117,137,162],"80.1%":[119],"recall":[120],"in":[121,136,147],"aligning":[122],"Lucene":[123],"corresponding":[127],"comments.":[128],"Our":[129],"27.6%":[132],"~":[133,144,160],"40.2%":[134],"improvement":[135,146],"compared":[138],"existing":[140],"method,":[141],"33.8%":[143],"39.7%":[145],"recall.":[148],"II,":[151],"66.4%":[159],"93.9%":[161],"extract":[164],"sentences.":[166]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
