{"id":"https://openalex.org/W4414017375","doi":"https://doi.org/10.1007/s00521-025-11593-9","title":"Large language models for efficient topic modeling","display_name":"Large language models for efficient topic modeling","publication_year":2025,"publication_date":"2025-09-05","ids":{"openalex":"https://openalex.org/W4414017375","doi":"https://doi.org/10.1007/s00521-025-11593-9"},"language":"en","primary_location":{"id":"doi:10.1007/s00521-025-11593-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-025-11593-9","pdf_url":null,"source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1007/s00521-025-11593-9","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075066824","display_name":"Panagiotis C. Theocharopoulos","orcid":"https://orcid.org/0000-0002-8607-5518"},"institutions":[{"id":"https://openalex.org/I145722265","display_name":"University of Thessaly","ror":"https://ror.org/04v4g9h31","country_code":"GR","type":"education","lineage":["https://openalex.org/I145722265"]}],"countries":["GR"],"is_corresponding":true,"raw_author_name":"Panagiotis C. Theocharopoulos","raw_affiliation_strings":["Department of Computer Science and Biomedical \u0399nformatics, University of Thessaly, 2-4 Papasiopoulou Street, 35131, Lamia, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Biomedical \u0399nformatics, University of Thessaly, 2-4 Papasiopoulou Street, 35131, Lamia, Greece","institution_ids":["https://openalex.org/I145722265"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050339315","display_name":"Panagiotis Anagnostou","orcid":"https://orcid.org/0000-0002-4775-9220"},"institutions":[{"id":"https://openalex.org/I145722265","display_name":"University of Thessaly","ror":"https://ror.org/04v4g9h31","country_code":"GR","type":"education","lineage":["https://openalex.org/I145722265"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Panagiotis Anagnostou","raw_affiliation_strings":["Department of Computer Science and Biomedical \u0399nformatics, University of Thessaly, 2-4 Papasiopoulou Street, 35131, Lamia, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Biomedical \u0399nformatics, University of Thessaly, 2-4 Papasiopoulou Street, 35131, Lamia, Greece","institution_ids":["https://openalex.org/I145722265"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085640042","display_name":"Spiros V. Georgakopoulos","orcid":"https://orcid.org/0000-0002-3374-0422"},"institutions":[{"id":"https://openalex.org/I145722265","display_name":"University of Thessaly","ror":"https://ror.org/04v4g9h31","country_code":"GR","type":"education","lineage":["https://openalex.org/I145722265"]},{"id":"https://openalex.org/I179161674","display_name":"Technological Educational Institute of Central Greece","ror":"https://ror.org/03ed9w591","country_code":"GR","type":"education","lineage":["https://openalex.org/I179161674"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Spiros V. Georgakopoulos","raw_affiliation_strings":["Department of Mathematics, University of Thessaly, 3rd km. Old National Road Lamia-Athens, 35100, Lamia, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics, University of Thessaly, 3rd km. Old National Road Lamia-Athens, 35100, Lamia, Greece","institution_ids":["https://openalex.org/I145722265","https://openalex.org/I179161674"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039205111","display_name":"Sotiris K. Tasoulis","orcid":"https://orcid.org/0000-0001-9536-4090"},"institutions":[{"id":"https://openalex.org/I145722265","display_name":"University of Thessaly","ror":"https://ror.org/04v4g9h31","country_code":"GR","type":"education","lineage":["https://openalex.org/I145722265"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Sotiris K. Tasoulis","raw_affiliation_strings":["Department of Computer Science and Biomedical \u0399nformatics, University of Thessaly, 2-4 Papasiopoulou Street, 35131, Lamia, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Biomedical \u0399nformatics, University of Thessaly, 2-4 Papasiopoulou Street, 35131, Lamia, Greece","institution_ids":["https://openalex.org/I145722265"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111235416","display_name":"Vassilis P. Plagianakos","orcid":"https://orcid.org/0000-0002-4266-701X"},"institutions":[{"id":"https://openalex.org/I145722265","display_name":"University of Thessaly","ror":"https://ror.org/04v4g9h31","country_code":"GR","type":"education","lineage":["https://openalex.org/I145722265"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Vassilis P. Plagianakos","raw_affiliation_strings":["Department of Computer Science and Biomedical \u0399nformatics, University of Thessaly, 2-4 Papasiopoulou Street, 35131, Lamia, Greece"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Biomedical \u0399nformatics, University of Thessaly, 2-4 Papasiopoulou Street, 35131, Lamia, Greece","institution_ids":["https://openalex.org/I145722265"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5075066824"],"corresponding_institution_ids":["https://openalex.org/I145722265"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13768121,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"37","issue":"29","first_page":"24421","last_page":"24439"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computational-science-and-engineering","display_name":"Computational Science and Engineering","score":0.8963869214057922},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.710835337638855},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3675172030925751},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2637595534324646}],"concepts":[{"id":"https://openalex.org/C68597687","wikidata":"https://www.wikidata.org/wiki/Q362601","display_name":"Computational Science and Engineering","level":2,"score":0.8963869214057922},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.710835337638855},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3675172030925751},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2637595534324646}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s00521-025-11593-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-025-11593-9","pdf_url":null,"source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s00521-025-11593-9","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-025-11593-9","pdf_url":null,"source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1492327544","https://openalex.org/W1988680150","https://openalex.org/W2048195127","https://openalex.org/W2081699408","https://openalex.org/W2113054345","https://openalex.org/W2129250947","https://openalex.org/W2478540127","https://openalex.org/W2784194212","https://openalex.org/W2963809228","https://openalex.org/W2970641574","https://openalex.org/W3036644138","https://openalex.org/W3041197811","https://openalex.org/W3045464143","https://openalex.org/W3210406624","https://openalex.org/W4306377799","https://openalex.org/W4321610465","https://openalex.org/W4323655724","https://openalex.org/W4366278664","https://openalex.org/W4366378786","https://openalex.org/W4375867312","https://openalex.org/W4385696031","https://openalex.org/W4387321091","https://openalex.org/W4388327657","https://openalex.org/W4389520497","https://openalex.org/W4393247609","https://openalex.org/W4400143066","https://openalex.org/W4400967166","https://openalex.org/W4402364221","https://openalex.org/W4403852924","https://openalex.org/W4404635284"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Abstract":[0],"The":[1,97],"utilization":[2],"of":[3,35,53,61,99,126,155,186,196,214],"large":[4,47,94],"language":[5],"models":[6],"(LLMs)":[7],"in":[8,19,33,59,93],"research":[9],"is":[10,87,102,178],"becoming":[11],"increasingly":[12],"prevalent,":[13],"as":[14],"they":[15],"offer":[16],"advanced":[17],"capabilities":[18,154,213],"processing":[20],"and":[21,37,64,90,164,198,205],"generating":[22],"human-like":[23],"text.":[24],"However,":[25],"this":[26,41,67],"advancement":[27],"comes":[28],"with":[29,50],"a":[30,103,119,124,147,169],"significant":[31],"trade-off":[32],"terms":[34,60],"time":[36,63,204],"computational":[38,184],"costs.":[39],"In":[40,75],"paper,":[42],"we":[43,69,78,135,145],"demonstrate":[44],"that":[45,108,151,176],"analyzing":[46],"text":[48,95],"datasets":[49],"the":[51,71,80,85,110,153,159,183,187,193,210],"use":[52],"LLMs":[54,156,197],"can":[55],"be":[56],"performed":[57],"efficiently":[58],"both":[62],"energy.":[65],"For":[66],"purpose,":[68],"utilize":[70],"Llama":[72],"pre-trained":[73,122],"model.":[74],"more":[76],"detail,":[77],"study":[79],"topic":[81,188],"modeling":[82,189],"task":[83],"where":[84],"goal":[86],"to":[88,157,180,192],"discover":[89],"identify":[91,136],"topics":[92,137,163],"corpora.":[96],"basis":[98],"our":[100],"approach":[101],"hierarchical":[104],"divisive":[105],"clustering":[106],"technique":[107],"clusters":[109],"data":[111,127],"based":[112],"on":[113,123],"their":[114],"semantic":[115],"similarity,":[116],"after":[117],"employing":[118],"Sentence-BERT":[120],"encoder,":[121],"variety":[125],"across":[128],"different":[129],"tasks.":[130],"Then,":[131],"using":[132],"an":[133],"LLM,":[134],"for":[138],"representative":[139],"samples":[140],"from":[141],"each":[142],"cluster.":[143],"Additionally,":[144],"introduce":[146],"new":[148],"evaluation":[149],"method":[150],"leverages":[152],"assess":[158],"alignment":[160],"between":[161],"discovered":[162],"ground":[165],"truth":[166],"labels,":[167],"providing":[168],"robust":[170],"validation":[171],"metric.":[172],"Our":[173],"findings":[174],"indicate":[175],"it":[177],"possible":[179],"effectively":[181],"reduce":[182],"cost":[185],"process":[190],"compared":[191],"direct":[194],"application":[195],"BERTopic,":[199],"while":[200],"simultaneously":[201],"enhancing":[202],"inference":[203],"overall":[206],"efficiency,":[207],"thereby":[208],"surpassing":[209],"current":[211],"state-of-the-art":[212],"BERTopic.":[215]},"counts_by_year":[],"updated_date":"2025-11-18T23:42:31.664661","created_date":"2025-10-10T00:00:00"}
