{"id":"https://openalex.org/W4399668292","doi":"https://doi.org/10.1145/3661167.3661168","title":"LEGION: Harnessing Pre-trained Language Models for GitHub Topic Recommendations with Distribution-Balance Loss","display_name":"LEGION: Harnessing Pre-trained Language Models for GitHub Topic Recommendations with Distribution-Balance Loss","publication_year":2024,"publication_date":"2024-06-14","ids":{"openalex":"https://openalex.org/W4399668292","doi":"https://doi.org/10.1145/3661167.3661168"},"language":"en","primary_location":{"id":"doi:10.1145/3661167.3661168","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3661167.3661168","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th International Conference on Evaluation and Assessment in Software Engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3661167.3661168","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018743003","display_name":"Yen-Trang Dang","orcid":"https://orcid.org/0009-0001-2781-9652"},"institutions":[{"id":"https://openalex.org/I94518387","display_name":"Hanoi University of Science and Technology","ror":"https://ror.org/04nyv3z04","country_code":"VN","type":"education","lineage":["https://openalex.org/I94518387"]}],"countries":["VN"],"is_corresponding":true,"raw_author_name":"Yen-Trang Dang","raw_affiliation_strings":["Hanoi University of Science and Technology, Viet Nam"],"raw_orcid":"https://orcid.org/0009-0001-2781-9652","affiliations":[{"raw_affiliation_string":"Hanoi University of Science and Technology, Viet Nam","institution_ids":["https://openalex.org/I94518387"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013306670","display_name":"Thanh Le-Cong","orcid":"https://orcid.org/0000-0002-9566-324X"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"The University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Thanh Le-Cong","raw_affiliation_strings":["The University of Melbourne, Australia"],"raw_orcid":"https://orcid.org/0000-0002-9566-324X","affiliations":[{"raw_affiliation_string":"The University of Melbourne, Australia","institution_ids":["https://openalex.org/I165779595"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048071520","display_name":"Phuc-Thanh Nguyen","orcid":"https://orcid.org/0009-0001-5440-6757"},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]},{"id":"https://openalex.org/I94518387","display_name":"Hanoi University of Science and Technology","ror":"https://ror.org/04nyv3z04","country_code":"VN","type":"education","lineage":["https://openalex.org/I94518387"]}],"countries":["IT","VN"],"is_corresponding":false,"raw_author_name":"Phuc-Thanh Nguyen","raw_affiliation_strings":["Hanoi University of Science and Technology, Viet Nam","University of L'Aquila, Italy"],"raw_orcid":"https://orcid.org/0009-0001-5440-6757","affiliations":[{"raw_affiliation_string":"Hanoi University of Science and Technology, Viet Nam","institution_ids":["https://openalex.org/I94518387"]},{"raw_affiliation_string":"University of L'Aquila, Italy","institution_ids":["https://openalex.org/I26415053"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021818134","display_name":"Anh M. T. Bui","orcid":"https://orcid.org/0000-0001-7877-9438"},"institutions":[{"id":"https://openalex.org/I94518387","display_name":"Hanoi University of Science and Technology","ror":"https://ror.org/04nyv3z04","country_code":"VN","type":"education","lineage":["https://openalex.org/I94518387"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Anh M. T. Bui","raw_affiliation_strings":["Hanoi University of Science and Technology, Viet Nam"],"raw_orcid":"https://orcid.org/0000-0001-7877-9438","affiliations":[{"raw_affiliation_string":"Hanoi University of Science and Technology, Viet Nam","institution_ids":["https://openalex.org/I94518387"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023235306","display_name":"Phuong T. Nguyen","orcid":"https://orcid.org/0000-0002-3666-4162"},"institutions":[{"id":"https://openalex.org/I26415053","display_name":"University of L'Aquila","ror":"https://ror.org/01j9p1r26","country_code":"IT","type":"education","lineage":["https://openalex.org/I26415053"]},{"id":"https://openalex.org/I94518387","display_name":"Hanoi University of Science and Technology","ror":"https://ror.org/04nyv3z04","country_code":"VN","type":"education","lineage":["https://openalex.org/I94518387"]}],"countries":["IT","VN"],"is_corresponding":false,"raw_author_name":"Phuong T. Nguyen","raw_affiliation_strings":["Hanoi University of Science and Technology, Viet Nam","University of L'Aquila, Italy"],"raw_orcid":"https://orcid.org/0000-0002-3666-4162","affiliations":[{"raw_affiliation_string":"Hanoi University of Science and Technology, Viet Nam","institution_ids":["https://openalex.org/I94518387"]},{"raw_affiliation_string":"University of L'Aquila, Italy","institution_ids":["https://openalex.org/I26415053"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075260906","display_name":"Xuan-Bach D. Le","orcid":"https://orcid.org/0000-0001-5044-1582"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"The University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Bach Le","raw_affiliation_strings":["The University of Melbourne, Australia"],"raw_orcid":"https://orcid.org/0000-0001-5044-1582","affiliations":[{"raw_affiliation_string":"The University of Melbourne, Australia","institution_ids":["https://openalex.org/I165779595"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071728979","display_name":"Hu\u1ef3nh Quy\u1ebft Th\u1eafng","orcid":"https://orcid.org/0000-0002-0788-6380"},"institutions":[{"id":"https://openalex.org/I94518387","display_name":"Hanoi University of Science and Technology","ror":"https://ror.org/04nyv3z04","country_code":"VN","type":"education","lineage":["https://openalex.org/I94518387"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Quyet-Thang Huynh","raw_affiliation_strings":["Hanoi University of Science and Technology, Viet Nam"],"raw_orcid":"https://orcid.org/0000-0002-0788-6380","affiliations":[{"raw_affiliation_string":"Hanoi University of Science and Technology, Viet Nam","institution_ids":["https://openalex.org/I94518387"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5018743003"],"corresponding_institution_ids":["https://openalex.org/I94518387"],"apc_list":null,"apc_paid":null,"fwci":0.3311,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.6290302,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"181","last_page":"190"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.779995322227478},{"id":"https://openalex.org/keywords/balance","display_name":"Balance (ability)","score":0.6056500673294067},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.488557904958725},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.42095404863357544},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34648796916007996},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.33776795864105225},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.33346229791641235},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.06533530354499817}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.779995322227478},{"id":"https://openalex.org/C168031717","wikidata":"https://www.wikidata.org/wiki/Q1530280","display_name":"Balance (ability)","level":2,"score":0.6056500673294067},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.488557904958725},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42095404863357544},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34648796916007996},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.33776795864105225},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.33346229791641235},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.06533530354499817},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3661167.3661168","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3661167.3661168","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th International Conference on Evaluation and Assessment in Software Engineering","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3661167.3661168","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3661167.3661168","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th International Conference on Evaluation and Assessment in Software Engineering","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.4699999988079071,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W61851215","https://openalex.org/W1566289585","https://openalex.org/W2075924051","https://openalex.org/W2096287423","https://openalex.org/W2124100711","https://openalex.org/W2145512597","https://openalex.org/W2168248828","https://openalex.org/W2514084604","https://openalex.org/W2621924596","https://openalex.org/W2738381526","https://openalex.org/W2784876765","https://openalex.org/W2963351448","https://openalex.org/W2971330564","https://openalex.org/W2997591727","https://openalex.org/W3022599808","https://openalex.org/W3034999214","https://openalex.org/W3093959336","https://openalex.org/W3094045953","https://openalex.org/W3096150021","https://openalex.org/W3121707215","https://openalex.org/W3165920028","https://openalex.org/W3172444956","https://openalex.org/W3177724167","https://openalex.org/W3201658153","https://openalex.org/W4200633062","https://openalex.org/W4221159558","https://openalex.org/W4229643319","https://openalex.org/W4234346598","https://openalex.org/W4297677548","https://openalex.org/W4300164480","https://openalex.org/W4313547549","https://openalex.org/W4313563649","https://openalex.org/W4313563756","https://openalex.org/W4376606916","https://openalex.org/W4382246105","https://openalex.org/W4384345689","https://openalex.org/W4386080933","https://openalex.org/W4388483049"],"related_works":["https://openalex.org/W2386367800","https://openalex.org/W2169518243","https://openalex.org/W2353574976","https://openalex.org/W1824021510","https://openalex.org/W4384702906","https://openalex.org/W2360150702","https://openalex.org/W2360176913","https://openalex.org/W2023046755","https://openalex.org/W2358150182","https://openalex.org/W4231937131"],"abstract_inverted_index":{"Open-source":[0],"development":[1,38],"has":[2],"revolutionized":[3],"the":[4,42,45],"software":[5,37],"industry":[6],"by":[7,68],"promoting":[8],"collaboration,":[9],"transparency,":[10],"and":[11,71],"community-driven":[12],"innovation.":[13],"Today,":[14],"a":[15,35],"vast":[16],"amount":[17],"of":[18,21,27,44,50],"various":[19],"kinds":[20],"open-source":[22],"software,":[23],"which":[24],"form":[25],"networks":[26],"repositories,":[28,52],"is":[29,74],"often":[30],"hosted":[31],"on":[32,93],"GitHub":[33,53,83],"\u2013":[34],"popular":[36],"platform.":[39],"To":[40],"enhance":[41],"discoverability":[43],"repository":[46,55],"networks,":[47],"i.e.,":[48],"groups":[49],"similar":[51],"introduced":[54],"topics":[56,80],"in":[57,101],"2017":[58],"that":[59],"enable":[60],"users":[61],"to":[62,77],"more":[63],"easily":[64],"explore":[65],"relevant":[66],"projects":[67],"type,":[69],"technology,":[70],"more.":[72],"It":[73],"thus":[75],"crucial":[76],"accurately":[78],"assign":[79],"for":[81,87,95],"each":[82],"repository.":[84],"Current":[85],"methods":[86],"automatic":[88],"topic":[89],"recommendation":[90],"rely":[91],"heavily":[92],"TF-IDF":[94],"encoding":[96],"textual":[97],"data,":[98],"presenting":[99],"challenges":[100],"understanding":[102],"semantic":[103],"nuances.":[104]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
