{"id":"https://openalex.org/W1979655048","doi":"https://doi.org/10.1145/2597008.2597150","title":"Understanding LDA in source code analysis","display_name":"Understanding LDA in source code analysis","publication_year":2014,"publication_date":"2014-05-20","ids":{"openalex":"https://openalex.org/W1979655048","doi":"https://doi.org/10.1145/2597008.2597150","mag":"1979655048"},"language":"en","primary_location":{"id":"doi:10.1145/2597008.2597150","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2597008.2597150","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd International Conference on Program Comprehension","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008760456","display_name":"David Binkley","orcid":"https://orcid.org/0000-0003-0059-4024"},"institutions":[{"id":"https://openalex.org/I165556055","display_name":"Loyola University Maryland","ror":"https://ror.org/01by1wp65","country_code":"US","type":"education","lineage":["https://openalex.org/I165556055"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Binkley","raw_affiliation_strings":["Loyola University Maryland, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Loyola University Maryland, USA","institution_ids":["https://openalex.org/I165556055"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051195404","display_name":"Daniel Heinz","orcid":"https://orcid.org/0000-0003-0321-0989"},"institutions":[{"id":"https://openalex.org/I165556055","display_name":"Loyola University Maryland","ror":"https://ror.org/01by1wp65","country_code":"US","type":"education","lineage":["https://openalex.org/I165556055"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Daniel Heinz","raw_affiliation_strings":["Loyola University Maryland, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Loyola University Maryland, USA","institution_ids":["https://openalex.org/I165556055"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037074105","display_name":"Dawn Lawrie","orcid":"https://orcid.org/0000-0001-7347-7086"},"institutions":[{"id":"https://openalex.org/I165556055","display_name":"Loyola University Maryland","ror":"https://ror.org/01by1wp65","country_code":"US","type":"education","lineage":["https://openalex.org/I165556055"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dawn Lawrie","raw_affiliation_strings":["Loyola University Maryland, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Loyola University Maryland, USA","institution_ids":["https://openalex.org/I165556055"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039091488","display_name":"Justin Overfelt","orcid":null},"institutions":[{"id":"https://openalex.org/I1322124587","display_name":"Booz Allen Hamilton (United States)","ror":"https://ror.org/051rcp357","country_code":"US","type":"company","lineage":["https://openalex.org/I1322124587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Justin Overfelt","raw_affiliation_strings":["Booz Allen Hamilton, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Booz Allen Hamilton, USA","institution_ids":["https://openalex.org/I1322124587"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":18.0484,"has_fulltext":false,"cited_by_count":58,"citation_normalized_percentile":{"value":0.98970733,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"26","last_page":"36"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.8183944821357727},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7417744994163513},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.699034571647644},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.6288152933120728},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5554434657096863},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.48492079973220825},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.42911022901535034},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.42100009322166443},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.41280245780944824},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.3711041510105133},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35476064682006836},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.12748342752456665},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10392382740974426}],"concepts":[{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.8183944821357727},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7417744994163513},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.699034571647644},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.6288152933120728},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5554434657096863},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.48492079973220825},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42911022901535034},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.42100009322166443},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.41280245780944824},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.3711041510105133},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35476064682006836},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.12748342752456665},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10392382740974426},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2597008.2597150","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2597008.2597150","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd International Conference on Program Comprehension","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.41999998688697815}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1880262756","https://openalex.org/W1972420078","https://openalex.org/W1997650168","https://openalex.org/W2014116953","https://openalex.org/W2077776641","https://openalex.org/W2113772893","https://openalex.org/W2135541598","https://openalex.org/W2140264852","https://openalex.org/W2143818143","https://openalex.org/W2146341620","https://openalex.org/W2156701999","https://openalex.org/W2165401136","https://openalex.org/W6639619044"],"related_works":["https://openalex.org/W2888805565","https://openalex.org/W4312773271","https://openalex.org/W4315588616","https://openalex.org/W2769501189","https://openalex.org/W2962686197","https://openalex.org/W2207653751","https://openalex.org/W4293863151","https://openalex.org/W3159709618","https://openalex.org/W2611137333","https://openalex.org/W3005513013"],"abstract_inverted_index":{"Latent":[0],"Dirichlet":[1],"Allocation":[2],"(LDA)":[3],"has":[4],"seen":[5],"increasing":[6],"use":[7],"in":[8,18,102,185],"the":[9,34,43,55,67,81,88,98,110,121,132,147,151,160,168,171,174,189,198,201,205,218,232],"understanding":[10,187,237],"of":[11,21,66,73,90,100,112,123,170,188,217,238],"source":[12,161,225],"code":[13,162,226],"and":[14,105,163,167,196,204,227],"its":[15,22,164],"related":[16],"artifacts":[17],"part":[19],"because":[20,135],"impressive":[23],"modeling":[24],"power.":[25],"However,":[26],"this":[27,74,124,155],"expressive":[28],"power":[29,99],"comes":[30],"at":[31],"a":[32,60,228,235],"cost:":[33],"technique":[35],"includes":[36],"several":[37],"tuning":[38,82,133,191,202,243],"parameters":[39,134,192,203],"whose":[40],"impact":[41],"on":[42,146],"resulting":[44],"LDA":[45,101,190,206],"model":[46],"must":[47],"be":[48],"carefully":[49],"considered.":[50],"An":[51],"obvious":[52],"example":[53],"is":[54,76,116,126,137,180,211],"burn-in":[56,61],"period;":[57],"too":[58],"short":[59],"period":[62],"leaves":[63],"excessive":[64],"echoes":[65],"initial":[68],"uniform":[69],"distribution.":[70],"The":[71],"aim":[72],"work":[75,125],"to":[77,96,118,128,181,212,240],"provide":[78],"insights":[79],"into":[80],"parameter's":[83],"impact.":[84],"Doing":[85],"so":[86],"improves":[87],"comprehension":[89],"both,":[91],"1)":[92],"researchers":[93],"who":[94,108],"look":[95],"exploit":[97],"their":[103,186],"research":[104],"2)":[106],"those":[107],"interpret":[109],"output":[111],"LDA-using":[113],"tools.":[114],"It":[115],"important":[117],"recognize":[119],"that":[120],"goal":[122,179,210],"not":[127],"establish":[129],"values":[130],"for":[131,234],"there":[136],"no":[138],"universal":[139],"best":[140],"setting.":[141],"Rather,":[142],"appropriate":[143],"settings":[144],"depend":[145],"problem":[148],"being":[149],"solved,":[150],"input":[152],"corpus":[153,230],"(in":[154],"case,":[156],"typically":[157],"words":[158],"from":[159],"supporting":[165],"artifacts),":[166],"needs":[169],"engineer":[172],"performing":[173],"analysis.":[175],"This":[176],"work's":[177],"primary":[178],"aid":[182],"software":[183],"engineers":[184],"by":[193],"demonstrating":[194],"numerically":[195],"graphically":[197],"relationship":[199],"between":[200],"output.":[207],"A":[208],"secondary":[209],"enable":[213],"more":[214],"informed":[215],"setting":[216],"parameters.":[219,244],"Results":[220],"obtained":[221],"using":[222],"both":[223],"production":[224],"synthetic":[229],"underscore":[231],"need":[233],"solid":[236],"how":[239],"configure":[241],"LDA's":[242]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":8},{"year":2018,"cited_by_count":12},{"year":2017,"cited_by_count":6},{"year":2016,"cited_by_count":8},{"year":2015,"cited_by_count":6},{"year":2014,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
