{"id":"https://openalex.org/W2756599087","doi":"https://doi.org/10.1145/3131704.3131713","title":"Document Distance Estimation via Code Graph Embedding","display_name":"Document Distance Estimation via Code Graph Embedding","publication_year":2017,"publication_date":"2017-09-23","ids":{"openalex":"https://openalex.org/W2756599087","doi":"https://doi.org/10.1145/3131704.3131713","mag":"2756599087"},"language":"en","primary_location":{"id":"doi:10.1145/3131704.3131713","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3131704.3131713","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 9th Asia-Pacific Symposium on Internetware","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061546771","display_name":"Zeqi Lin","orcid":"https://orcid.org/0009-0001-2563-7601"},"institutions":[{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zeqi Lin","raw_affiliation_strings":["Key Laboratory of High Confidence Software Technologies, Ministry of Education, Beijing, China and School of Electronics Engineering and Computer Science, Peking University, Beijing, China and Beida(Binhai) Information Research, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies, Ministry of Education, Beijing, China and School of Electronics Engineering and Computer Science, Peking University, Beijing, China and Beida(Binhai) Information Research, Tianjin, China","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009946754","display_name":"Junfeng Zhao","orcid":"https://orcid.org/0000-0002-1268-5006"},"institutions":[{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junfeng Zhao","raw_affiliation_strings":["Key Laboratory of High Confidence Software Technologies, Ministry of Education, Beijing, China and School of Electronics Engineering and Computer Science, Peking University, Beijing, China and Beida(Binhai) Information Research, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies, Ministry of Education, Beijing, China and School of Electronics Engineering and Computer Science, Peking University, Beijing, China and Beida(Binhai) Information Research, Tianjin, China","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103872660","display_name":"Yanzhen Zou","orcid":null},"institutions":[{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanzhen Zou","raw_affiliation_strings":["Key Laboratory of High Confidence Software Technologies, Ministry of Education, Beijing, China and School of Electronics Engineering and Computer Science, Peking University, Beijing, China and Beida(Binhai) Information Research, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies, Ministry of Education, Beijing, China and School of Electronics Engineering and Computer Science, Peking University, Beijing, China and Beida(Binhai) Information Research, Tianjin, China","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102928967","display_name":"Bing Xie","orcid":"https://orcid.org/0000-0002-2988-2575"},"institutions":[{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bing Xie","raw_affiliation_strings":["Key Laboratory of High Confidence Software Technologies, Ministry of Education, Beijing, China and School of Electronics Engineering and Computer Science, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of High Confidence Software Technologies, Ministry of Education, Beijing, China and School of Electronics Engineering and Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5061546771"],"corresponding_institution_ids":["https://openalex.org/I20231570","https://openalex.org/I4210128818"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.16810219,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"6","issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9886999726295471,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8491860628128052},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5797942876815796},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.5215001702308655},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4985771179199219},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4926939308643341},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.48927947878837585},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.4794536828994751},{"id":"https://openalex.org/keywords/traceability","display_name":"Traceability","score":0.46956586837768555},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.442821204662323},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4386168122291565},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4316890239715576},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4273189902305603},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34608426690101624},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.26119327545166016},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1961384415626526},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.14331045746803284}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8491860628128052},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5797942876815796},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.5215001702308655},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4985771179199219},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4926939308643341},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.48927947878837585},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4794536828994751},{"id":"https://openalex.org/C153876917","wikidata":"https://www.wikidata.org/wiki/Q899704","display_name":"Traceability","level":2,"score":0.46956586837768555},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.442821204662323},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4386168122291565},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4316890239715576},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4273189902305603},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34608426690101624},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.26119327545166016},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1961384415626526},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.14331045746803284},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3131704.3131713","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3131704.3131713","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 9th Asia-Pacific Symposium on Internetware","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W68132019","https://openalex.org/W1559169059","https://openalex.org/W1566018662","https://openalex.org/W1660390307","https://openalex.org/W1880262756","https://openalex.org/W1981109290","https://openalex.org/W1985947101","https://openalex.org/W1997650168","https://openalex.org/W2014116953","https://openalex.org/W2017485217","https://openalex.org/W2017593508","https://openalex.org/W2026608875","https://openalex.org/W2038847163","https://openalex.org/W2040043446","https://openalex.org/W2050372846","https://openalex.org/W2050396504","https://openalex.org/W2063384185","https://openalex.org/W2073587810","https://openalex.org/W2089759055","https://openalex.org/W2097001189","https://openalex.org/W2098162425","https://openalex.org/W2100739938","https://openalex.org/W2110008837","https://openalex.org/W2110220994","https://openalex.org/W2116737258","https://openalex.org/W2122060876","https://openalex.org/W2125101937","https://openalex.org/W2127426251","https://openalex.org/W2127795553","https://openalex.org/W2139543149","https://openalex.org/W2140255470","https://openalex.org/W2147152072","https://openalex.org/W2148484494","https://openalex.org/W2150240046","https://openalex.org/W2153546999","https://openalex.org/W2156833313","https://openalex.org/W2184957013","https://openalex.org/W2247119764","https://openalex.org/W2251558607","https://openalex.org/W2283196293","https://openalex.org/W2387719207","https://openalex.org/W2401290433","https://openalex.org/W2513738415","https://openalex.org/W2539033431","https://openalex.org/W2998704965","https://openalex.org/W3147133761","https://openalex.org/W3149255455","https://openalex.org/W4250687526","https://openalex.org/W4285719527","https://openalex.org/W6680532216"],"related_works":["https://openalex.org/W2378709054","https://openalex.org/W4380301954","https://openalex.org/W2803090313","https://openalex.org/W1482465488","https://openalex.org/W2052375654","https://openalex.org/W2376767034","https://openalex.org/W2350918606","https://openalex.org/W2982483023","https://openalex.org/W2049082574","https://openalex.org/W3081644756"],"abstract_inverted_index":{"Accurately":[0],"representing":[1],"the":[2,108,113,136],"distance":[3,59,114,122],"between":[4,68,94,115],"two":[5,116],"documents":[6,42,69,99,117],"(i.e.":[7],"pieces":[8],"of":[9,104,138],"textual":[10],"information":[11,73],"extracted":[12],"from":[13],"various":[14],"software":[15,23,75],"artifacts)":[16],"has":[17],"far-reaching":[18],"applications":[19],"in":[20,74,85,107,131],"many":[21],"automated":[22],"engineering":[24],"approaches,":[25],"such":[26],"as":[27,83,100],"concept":[28],"location,":[29],"bug":[30],"location":[31],"and":[32,111],"traceability":[33],"link":[34],"recovery.":[35],"This":[36,62],"is":[37],"a":[38,56,86,127],"challenging":[39],"task,":[40],"since":[41],"containing":[43],"different":[44],"words":[45],"may":[46],"have":[47],"similar":[48],"semantic":[49,66],"meanings.":[50],"In":[51],"this":[52],"paper,":[53],"we":[54,79,97],"propose":[55],"novel":[57],"document":[58,128],"estimation":[60],"approach.":[61,140],"approach":[63,148],"captures":[64],"latent":[65],"associations":[67],"through":[70],"analyzing":[71],"structural":[72,92],"source":[76],"code:":[77],"first,":[78],"embed":[80],"code":[81,105],"elements":[82,106],"points":[84],"shared":[87],"representation":[88,109],"space":[89,110],"according":[90],"to":[91,118,134],"dependencies":[93],"them;":[95],"then,":[96],"represent":[98],"weighted":[101],"point":[102],"clouds":[103],"reduce":[112],"an":[119],"earth":[120],"mover's":[121],"transportation":[123],"problem.":[124],"We":[125],"define":[126],"classification":[129],"task":[130],"StackOverflow":[132],"dataset":[133],"evaluate":[135],"effectiveness":[137],"our":[139,147],"The":[141],"empirical":[142],"evaluation":[143],"results":[144],"show":[145],"that":[146],"outperforms":[149],"several":[150],"state-of-the-art":[151],"approaches.":[152]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
