{"id":"https://openalex.org/W2967047440","doi":"https://doi.org/10.1145/3338906.3338963","title":"A learning-based approach for automatic construction of domain glossary from source code and documentation","display_name":"A learning-based approach for automatic construction of domain glossary from source code and documentation","publication_year":2019,"publication_date":"2019-08-09","ids":{"openalex":"https://openalex.org/W2967047440","doi":"https://doi.org/10.1145/3338906.3338963","mag":"2967047440"},"language":"en","primary_location":{"id":"doi:10.1145/3338906.3338963","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3338906.3338963","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2019 27th ACM Joint Meeting on European Software Engineering Conference and Symposium on the Foundations of Software Engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100329466","display_name":"Chong Wang","orcid":"https://orcid.org/0000-0003-1424-6290"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chong Wang","raw_affiliation_strings":["Fudan University, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101854992","display_name":"Xin Peng","orcid":"https://orcid.org/0000-0003-3376-2581"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Peng","raw_affiliation_strings":["Fudan University, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100697907","display_name":"Mingwei Liu","orcid":"https://orcid.org/0000-0002-3462-997X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingwei Liu","raw_affiliation_strings":["Fudan University, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028641941","display_name":"Zhenchang Xing","orcid":"https://orcid.org/0000-0001-7663-1421"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Zhenchang Xing","raw_affiliation_strings":["Australian National University, Australia"],"affiliations":[{"raw_affiliation_string":"Australian National University, Australia","institution_ids":["https://openalex.org/I118347636"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064710609","display_name":"Xuefang Bai","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuefang Bai","raw_affiliation_strings":["Fudan University, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102928967","display_name":"Bing Xie","orcid":"https://orcid.org/0000-0002-2988-2575"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bing Xie","raw_affiliation_strings":["Peking University, China"],"affiliations":[{"raw_affiliation_string":"Peking University, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101616845","display_name":"Tuo Wang","orcid":"https://orcid.org/0000-0003-2308-2419"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tuo Wang","raw_affiliation_strings":["Fudan University, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100329466"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":9.8354,"has_fulltext":false,"cited_by_count":50,"citation_normalized_percentile":{"value":0.98056064,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"97","last_page":"108"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/glossary","display_name":"Glossary","score":0.8693121671676636},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8311800956726074},{"id":"https://openalex.org/keywords/documentation","display_name":"Documentation","score":0.6634323596954346},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6156041026115417},{"id":"https://openalex.org/keywords/identifier","display_name":"Identifier","score":0.6109669804573059},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.6035366654396057},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5022263526916504},{"id":"https://openalex.org/keywords/software-documentation","display_name":"Software documentation","score":0.5007524490356445},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.4820728898048401},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.47136107087135315},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.46000319719314575},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.453583300113678},{"id":"https://openalex.org/keywords/internal-documentation","display_name":"Internal documentation","score":0.4375479519367218},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4299446940422058},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.41758596897125244},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.40921205282211304},{"id":"https://openalex.org/keywords/software-development","display_name":"Software development","score":0.30087658762931824},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2104271650314331},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.17750892043113708},{"id":"https://openalex.org/keywords/software-development-process","display_name":"Software development process","score":0.166214257478714},{"id":"https://openalex.org/keywords/software-construction","display_name":"Software construction","score":0.10604351758956909}],"concepts":[{"id":"https://openalex.org/C2780031656","wikidata":"https://www.wikidata.org/wiki/Q859161","display_name":"Glossary","level":2,"score":0.8693121671676636},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8311800956726074},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.6634323596954346},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6156041026115417},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.6109669804573059},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.6035366654396057},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5022263526916504},{"id":"https://openalex.org/C81587897","wikidata":"https://www.wikidata.org/wiki/Q181702","display_name":"Software documentation","level":5,"score":0.5007524490356445},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.4820728898048401},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.47136107087135315},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.46000319719314575},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.453583300113678},{"id":"https://openalex.org/C140396857","wikidata":"https://www.wikidata.org/wiki/Q16934771","display_name":"Internal documentation","level":5,"score":0.4375479519367218},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4299446940422058},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.41758596897125244},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.40921205282211304},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.30087658762931824},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2104271650314331},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.17750892043113708},{"id":"https://openalex.org/C180152950","wikidata":"https://www.wikidata.org/wiki/Q2904257","display_name":"Software development process","level":4,"score":0.166214257478714},{"id":"https://openalex.org/C186846655","wikidata":"https://www.wikidata.org/wiki/Q3398377","display_name":"Software construction","level":4,"score":0.10604351758956909},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3338906.3338963","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3338906.3338963","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2019 27th ACM Joint Meeting on European Software Engineering Conference and Symposium on the Foundations of Software Engineering","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W43804564","https://openalex.org/W579397108","https://openalex.org/W1539495021","https://openalex.org/W1849984936","https://openalex.org/W1964968887","https://openalex.org/W1973583889","https://openalex.org/W1992587390","https://openalex.org/W2004763266","https://openalex.org/W2007264217","https://openalex.org/W2018360580","https://openalex.org/W2026608875","https://openalex.org/W2045044649","https://openalex.org/W2066792529","https://openalex.org/W2068737686","https://openalex.org/W2116266212","https://openalex.org/W2120755390","https://openalex.org/W2122060876","https://openalex.org/W2158018156","https://openalex.org/W2177607365","https://openalex.org/W2250539671","https://openalex.org/W2296283641","https://openalex.org/W2366532918","https://openalex.org/W2406204547","https://openalex.org/W2406365535","https://openalex.org/W2553146174","https://openalex.org/W2558786277","https://openalex.org/W2560147852","https://openalex.org/W2600834311","https://openalex.org/W2617307387","https://openalex.org/W2767532479","https://openalex.org/W2767563557","https://openalex.org/W2767782162","https://openalex.org/W2794354396","https://openalex.org/W2889792925","https://openalex.org/W2897987981","https://openalex.org/W2901934569","https://openalex.org/W2964064835","https://openalex.org/W2997181101","https://openalex.org/W4241395538","https://openalex.org/W4248426528","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W3120493416","https://openalex.org/W2602989241","https://openalex.org/W2112489737","https://openalex.org/W2098192829","https://openalex.org/W2764664989","https://openalex.org/W2108337646","https://openalex.org/W2035042871","https://openalex.org/W2646159910","https://openalex.org/W2404091770","https://openalex.org/W2767775279"],"abstract_inverted_index":{"A":[0],"domain":[1,30,55,146,149,171],"glossary":[2,56,89,172],"that":[3],"organizes":[4],"domain-specific":[5,84,102],"concepts":[6,112,155],"and":[7,10,17,36,60,76,95,126,132,147,150,153,159,173,179],"their":[8,114],"aliases":[9,108],"relations":[11,135,161],"is":[12,40],"essential":[13],"for":[14,51,123,176],"knowledge":[15,182],"acquisition":[16,180],"software":[18,34,61],"development.":[19],"Existing":[20],"approaches":[21],"use":[22],"linguistic":[23],"heuristics":[24],"or":[25],"term-frequency-based":[26],"statistics":[27],"to":[28,81,87,113,143],"identify":[29],"specific":[31],"terms":[32,71,90],"from":[33,57,73,183],"documentation,":[35],"thus":[37],"the":[38,93,99,107,110,137,166,169,177],"accuracy":[39,167],"often":[41],"low.":[42],"In":[43],"this":[44],"paper,":[45],"we":[46],"propose":[47],"a":[48,66,83,118],"learning-based":[49],"approach":[50,64,142],"automatic":[52],"construction":[53],"of":[54,68,98,109,120,168,181,186],"source":[58],"code":[59,74],"documentation.":[62],"The":[63],"uses":[65],"set":[67,119],"high-quality":[69],"seed":[70],"identified":[72],"identifiers":[75],"natural":[77],"language":[78],"concept":[79],"definitions":[80],"train":[82],"prediction":[85],"model":[86],"recognize":[88],"based":[91],"on":[92],"lexical":[94],"semantic":[96],"context":[97],"sentences":[100,122],"mentioning":[101],"concepts.":[103,138],"It":[104],"then":[105],"merges":[106],"same":[111],"canonical":[115],"names,":[116],"selects":[117],"explanation":[121],"each":[124],"concept,":[125],"identifies":[127],"\"is":[128],"a\",":[129,131],"\"has":[130],"\"related":[133],"to\"":[134],"between":[136],"We":[139],"apply":[140],"our":[141],"deep":[144],"learning":[145],"Hadoop":[148],"harvest":[151],"5,382":[152],"2,069":[154],"together":[156],"with":[157],"16,962":[158],"6,815":[160],"respectively.":[162],"Our":[163],"evaluation":[164],"validates":[165],"extracted":[170],"its":[174],"usefulness":[175],"fusion":[178],"different":[184,187],"documents":[185],"projects.":[188]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":13},{"year":2022,"cited_by_count":10},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
