{"id":"https://openalex.org/W4312782249","doi":"https://doi.org/10.1109/access.2022.3226238","title":"Predicting Duplicate in Bug Report Using Topic-Based Duplicate Learning With Fine Tuning-Based BERT Algorithm","display_name":"Predicting Duplicate in Bug Report Using Topic-Based Duplicate Learning With Fine Tuning-Based BERT Algorithm","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4312782249","doi":"https://doi.org/10.1109/access.2022.3226238"},"language":"en","primary_location":{"id":"doi:10.1109/access.2022.3226238","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2022.3226238","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2022.3226238","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Taemin Kim","orcid":"https://orcid.org/0000-0003-3493-2917"},"institutions":[{"id":"https://openalex.org/I71007489","display_name":"Kyungnam University","ror":"https://ror.org/037pkxm09","country_code":"KR","type":"education","lineage":["https://openalex.org/I71007489"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Taemin Kim","raw_affiliation_strings":["Department of Computer Science and Engineering, Kyungnam University, Changwon, South Korea","ORCiD"],"raw_orcid":"https://orcid.org/0000-0003-3493-2917","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Kyungnam University, Changwon, South Korea","institution_ids":["https://openalex.org/I71007489"]},{"raw_affiliation_string":"ORCiD","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033095132","display_name":"Geunseok Yang","orcid":"https://orcid.org/0000-0001-5677-5129"},"institutions":[{"id":"https://openalex.org/I71007489","display_name":"Kyungnam University","ror":"https://ror.org/037pkxm09","country_code":"KR","type":"education","lineage":["https://openalex.org/I71007489"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Geunseok Yang","raw_affiliation_strings":["Department of Computer Science and Engineering, Kyungnam University, Changwon, South Korea","ORCiD"],"raw_orcid":"https://orcid.org/0000-0001-5677-5129","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Kyungnam University, Changwon, South Korea","institution_ids":["https://openalex.org/I71007489"]},{"raw_affiliation_string":"ORCiD","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":4.1426,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.94729979,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"10","issue":null,"first_page":"129666","last_page":"129675"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8378338813781738},{"id":"https://openalex.org/keywords/software-regression","display_name":"Software regression","score":0.7210750579833984},{"id":"https://openalex.org/keywords/eclipse","display_name":"Eclipse","score":0.6008925437927246},{"id":"https://openalex.org/keywords/software-bug","display_name":"Software bug","score":0.581763744354248},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.4856890141963959},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4845925569534302},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.4753703474998474},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.43248164653778076},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.42346641421318054},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35680443048477173},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2844015061855316},{"id":"https://openalex.org/keywords/software-development","display_name":"Software development","score":0.2269650101661682},{"id":"https://openalex.org/keywords/software-quality","display_name":"Software quality","score":0.20532187819480896},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1548754870891571}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8378338813781738},{"id":"https://openalex.org/C191727507","wikidata":"https://www.wikidata.org/wiki/Q24346","display_name":"Software regression","level":5,"score":0.7210750579833984},{"id":"https://openalex.org/C2778505590","wikidata":"https://www.wikidata.org/wiki/Q141022","display_name":"Eclipse","level":2,"score":0.6008925437927246},{"id":"https://openalex.org/C1009929","wikidata":"https://www.wikidata.org/wiki/Q179550","display_name":"Software bug","level":3,"score":0.581763744354248},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.4856890141963959},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4845925569534302},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4753703474998474},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.43248164653778076},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.42346641421318054},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35680443048477173},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2844015061855316},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.2269650101661682},{"id":"https://openalex.org/C117447612","wikidata":"https://www.wikidata.org/wiki/Q1412670","display_name":"Software quality","level":4,"score":0.20532187819480896},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1548754870891571},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2022.3226238","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2022.3226238","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:c286853873284a95bbec00144e1f50d7","is_oa":true,"landing_page_url":"https://doaj.org/article/c286853873284a95bbec00144e1f50d7","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 10, Pp 129666-129675 (2022)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2022.3226238","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2022.3226238","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","score":0.4099999964237213,"display_name":"Partnerships for the goals"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321271","display_name":"Kyungnam University","ror":"https://ror.org/037pkxm09"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W9328536","https://openalex.org/W1584308190","https://openalex.org/W1881549354","https://openalex.org/W1966388643","https://openalex.org/W1981109290","https://openalex.org/W1999635750","https://openalex.org/W2044225531","https://openalex.org/W2045530509","https://openalex.org/W2047604680","https://openalex.org/W2090094826","https://openalex.org/W2099821052","https://openalex.org/W2123442489","https://openalex.org/W2130146200","https://openalex.org/W2136960485","https://openalex.org/W2149234515","https://openalex.org/W2156833313","https://openalex.org/W2165022036","https://openalex.org/W2293634267","https://openalex.org/W2795935179","https://openalex.org/W2896457183","https://openalex.org/W2908040686","https://openalex.org/W2944955910","https://openalex.org/W3006381853","https://openalex.org/W3149255455","https://openalex.org/W3163479207","https://openalex.org/W3195782437","https://openalex.org/W3195947713","https://openalex.org/W3216799472","https://openalex.org/W4300164480","https://openalex.org/W6635269506","https://openalex.org/W6639490048","https://openalex.org/W6696934422","https://openalex.org/W6755207826","https://openalex.org/W6771713106","https://openalex.org/W6795226064"],"related_works":["https://openalex.org/W3009111612","https://openalex.org/W2442359302","https://openalex.org/W2044225531","https://openalex.org/W2597543511","https://openalex.org/W3045036521","https://openalex.org/W2135303064","https://openalex.org/W2901462014","https://openalex.org/W3004570974","https://openalex.org/W2967225146","https://openalex.org/W2945475639"],"abstract_inverted_index":{"As":[0],"the":[1,45,48,51,60,76,81,93,107,110,124,130,148,173,177,182,188,208,279,288],"usage":[2],"and":[3,11,53,84,133,151,176,191,202,211,215,229,236,267,273],"coverage":[4],"of":[5,50,90,109],"software":[6],"increase,":[7],"various":[8],"functional":[9],"improvements":[10],"bugs":[12],"are":[13,74,154],"occurring.":[14],"The":[15,41,221],"Eclipse,":[16,212,233,264],"Mozilla":[17],"open-source":[18],"projects":[19],"receive":[20],"more":[21],"than":[22,287],"about":[23,225,269],"300":[24],"bug":[25,39,46,67,72,98,140,143,149,194],"reports":[26,73,99],"per":[27],"day.":[28],"Usually,":[29],"when":[30],"a":[31,34,38,65,88,139],"user":[32],"finds":[33],"bug,":[35,52,83],"they":[36],"write":[37],"report.":[40,68],"developer":[42,61,77,111],"assigned":[43],"to":[44,162,187,206],"reads":[47],"content":[49],"if":[54,70],"it":[55,63],"has":[56],"already":[57],"been":[58],"fixed,":[59],"marks":[62],"as":[64,185],"duplicate":[66,71,178,193],"However,":[69],"submitted,":[75],"must":[78],"manually":[79],"identify":[80],"same":[82],"this":[85,117,119,197],"process":[86],"requires":[87],"lot":[89],"effort":[91,105],"by":[92,142,156,158],"developer.":[94],"If":[95],"redundancies":[96],"in":[97,232,263],"can":[100,112],"be":[101,113],"identified":[102],"automatically,":[103],"unnecessary":[104],"on":[106],"part":[108],"reduced.":[114],"To":[115],"resolve":[116],"problem,":[118],"paper":[120],"predicts":[121,192],"redundancy":[122],"using":[123,172],"BERT":[125,189],"(Bidirectional":[126],"Encoder":[127],"Representations":[128],"from":[129,147],"Transformer)":[131],"algorithm":[132,190],"topic-based":[134],"duplicate/non-duplicate":[135],"feature":[136,168],"extraction.":[137],"First,":[138],"report":[141],"status":[144,157,175],"is":[145,170,282],"extracted":[146,183],"repository,":[150],"topic":[152,160],"models":[153],"constructed":[155],"applying":[159],"modeling":[161],"each":[163,166],"status.":[164,179],"In":[165,196,239],"topic,":[167],"selection":[169],"performed":[171],"non-duplicate":[174],"It":[180],"learns":[181],"features":[184],"inputs":[186],"reports.":[195],"paper,":[198],"Precision,":[199],"Recall,":[200],"F-measure,":[201],"Accuracy":[203],"were":[204,219],"used":[205],"evaluate":[207],"proposed":[209,222,280],"model,":[210],"Mozilla,":[213,234,265],"Apache,":[214,235,266],"KDE":[216,268],"open":[217],"sources":[218],"used.":[220],"model":[223,281],"shows":[224],"87.67%,":[226],"89.85%,":[227],"87.03%,":[228],"88.95%":[230],"performance":[231,241],"KDE,":[237],"respectively.":[238],"addition,":[240],"comparison":[242],"with":[243],"baselines":[244],"(Na\u00efve":[245],"Bayes,":[246],"Randomforest,":[247],"Convolutional":[248,256],"Neural":[249,257],"Network":[250],"(CNN),":[251],"Long":[252],"Short-Term":[253,259],"Memory":[254,260],"(LSTM),":[255],"Networks-Long":[258],"Networks":[261],"(CNN-LSTM))":[262],"36.33%,":[270],"44.46%,":[271],"47.77%,":[272],"45.17%,":[274],"improvement,":[275],"respectively,":[276],"showed":[277],"that":[278],"better":[283],"at":[284],"detecting":[285],"duplicates":[286],"baselines.":[289]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
