{"id":"https://openalex.org/W4220870389","doi":"https://doi.org/10.1007/s11192-022-04318-5","title":"Validation of scientific topic models using graph analysis and corpus metadata","display_name":"Validation of scientific topic models using graph analysis and corpus metadata","publication_year":2022,"publication_date":"2022-03-30","ids":{"openalex":"https://openalex.org/W4220870389","doi":"https://doi.org/10.1007/s11192-022-04318-5"},"language":"en","primary_location":{"id":"doi:10.1007/s11192-022-04318-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11192-022-04318-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11192-022-04318-5.pdf","source":{"id":"https://openalex.org/S148561398","display_name":"Scientometrics","issn_l":"0138-9130","issn":["0138-9130","1588-2861"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320108","host_organization_name":"Springer Nature (Netherlands)","host_organization_lineage":["https://openalex.org/P4310320108","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature (Netherlands)","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Scientometrics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s11192-022-04318-5.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036862156","display_name":"Manuel A. V\u00e1zquez","orcid":"https://orcid.org/0000-0003-3365-2622"},"institutions":[{"id":"https://openalex.org/I50357001","display_name":"Universidad Carlos III de Madrid","ror":"https://ror.org/03ths8210","country_code":"ES","type":"education","lineage":["https://openalex.org/I50357001"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Manuel A. V\u00e1zquez","raw_affiliation_strings":["Universidad Carlos III de Madrid, Madrid, Spain"],"raw_orcid":"https://orcid.org/0000-0003-3365-2622","affiliations":[{"raw_affiliation_string":"Universidad Carlos III de Madrid, Madrid, Spain","institution_ids":["https://openalex.org/I50357001"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053479617","display_name":"Jorge Pereira-Delgado","orcid":null},"institutions":[{"id":"https://openalex.org/I50357001","display_name":"Universidad Carlos III de Madrid","ror":"https://ror.org/03ths8210","country_code":"ES","type":"education","lineage":["https://openalex.org/I50357001"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Jorge Pereira-Delgado","raw_affiliation_strings":["Universidad Carlos III de Madrid, Madrid, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universidad Carlos III de Madrid, Madrid, Spain","institution_ids":["https://openalex.org/I50357001"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030068883","display_name":"Jes\u00fas Cid\u2010Sueiro","orcid":"https://orcid.org/0000-0002-5243-5992"},"institutions":[{"id":"https://openalex.org/I50357001","display_name":"Universidad Carlos III de Madrid","ror":"https://ror.org/03ths8210","country_code":"ES","type":"education","lineage":["https://openalex.org/I50357001"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Jes\u00fas Cid-Sueiro","raw_affiliation_strings":["Universidad Carlos III de Madrid, Madrid, Spain"],"raw_orcid":"https://orcid.org/0000-0002-5243-5992","affiliations":[{"raw_affiliation_string":"Universidad Carlos III de Madrid, Madrid, Spain","institution_ids":["https://openalex.org/I50357001"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046086664","display_name":"Jer\u00f3nimo Arenas\u2010Garc\u00eda","orcid":"https://orcid.org/0000-0003-4071-7068"},"institutions":[{"id":"https://openalex.org/I50357001","display_name":"Universidad Carlos III de Madrid","ror":"https://ror.org/03ths8210","country_code":"ES","type":"education","lineage":["https://openalex.org/I50357001"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Jer\u00f3nimo Arenas-Garc\u00eda","raw_affiliation_strings":["Universidad Carlos III de Madrid, Madrid, Spain"],"raw_orcid":"https://orcid.org/0000-0003-4071-7068","affiliations":[{"raw_affiliation_string":"Universidad Carlos III de Madrid, Madrid, Spain","institution_ids":["https://openalex.org/I50357001"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5046086664"],"corresponding_institution_ids":["https://openalex.org/I50357001"],"apc_list":{"value":2290,"currency":"EUR","value_usd":2890},"apc_paid":{"value":2290,"currency":"EUR","value_usd":2890},"fwci":10.5517,"has_fulltext":true,"cited_by_count":14,"citation_normalized_percentile":{"value":0.98150224,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"127","issue":"9","first_page":"5441","last_page":"5458"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9817000031471252,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.8370825052261353},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8065065145492554},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.7652713060379028},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.6786566972732544},{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.6440882682800293},{"id":"https://openalex.org/keywords/perplexity","display_name":"Perplexity","score":0.5631051063537598},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5110350847244263},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5022573471069336},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.46952763199806213},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.4576624035835266},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.441069632768631},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.4290268123149872},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3247619867324829},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.29057595133781433},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.25744208693504333},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.25611454248428345},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.11422368884086609}],"concepts":[{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.8370825052261353},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8065065145492554},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.7652713060379028},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.6786566972732544},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.6440882682800293},{"id":"https://openalex.org/C100279451","wikidata":"https://www.wikidata.org/wiki/Q372193","display_name":"Perplexity","level":3,"score":0.5631051063537598},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5110350847244263},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5022573471069336},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.46952763199806213},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.4576624035835266},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.441069632768631},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.4290268123149872},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3247619867324829},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.29057595133781433},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25744208693504333},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.25611454248428345},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.11422368884086609},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1007/s11192-022-04318-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11192-022-04318-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11192-022-04318-5.pdf","source":{"id":"https://openalex.org/S148561398","display_name":"Scientometrics","issn_l":"0138-9130","issn":["0138-9130","1588-2861"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320108","host_organization_name":"Springer Nature (Netherlands)","host_organization_lineage":["https://openalex.org/P4310320108","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature (Netherlands)","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Scientometrics","raw_type":"journal-article"},{"id":"pmh:oai:e-archivo.uc3m.es:10016/38468","is_oa":true,"landing_page_url":"http://hdl.handle.net/10016/38468","pdf_url":"https://e-archivo.uc3m.es/bitstreams/bd1070e8-95e5-4afd-bc00-3c07f55d3116/download","source":{"id":"https://openalex.org/S4306400817","display_name":"e-Archivo (Carlos III University of Madrid)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I50357001","host_organization_name":"Universidad Carlos III de Madrid","host_organization_lineage":["https://openalex.org/I50357001"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"research article"},{"id":"pmh:oai:RePEc:spr:scient:v:127:y:2022:i:9:d:10.1007_s11192-022-04318-5","is_oa":false,"landing_page_url":"http://link.springer.com/10.1007/s11192-022-04318-5","pdf_url":null,"source":{"id":"https://openalex.org/S4306401271","display_name":"RePEc: Research Papers in Economics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I77793887","host_organization_name":"Federal Reserve Bank of St. Louis","host_organization_lineage":["https://openalex.org/I77793887"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.1007/s11192-022-04318-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11192-022-04318-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11192-022-04318-5.pdf","source":{"id":"https://openalex.org/S148561398","display_name":"Scientometrics","issn_l":"0138-9130","issn":["0138-9130","1588-2861"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320108","host_organization_name":"Springer Nature (Netherlands)","host_organization_lineage":["https://openalex.org/P4310320108","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature (Netherlands)","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Scientometrics","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6700000166893005,"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9"}],"awards":[{"id":"https://openalex.org/G5204345448","display_name":null,"funder_award_id":"TEC2017-83838-R","funder_id":"https://openalex.org/F4320315062","funder_display_name":"Ministerio de Ciencia, Innovaci\u00f3n y Universidades"},{"id":"https://openalex.org/G5789747333","display_name":null,"funder_award_id":"101004870","funder_id":"https://openalex.org/F4320332999","funder_display_name":"Horizon 2020 Framework Programme"},{"id":"https://openalex.org/G7328098333","display_name":"A Competitive Intelligence Cloud/HPC Platform for AI-based STI Policy Making","funder_award_id":"101004870","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320315062","display_name":"Ministerio de Ciencia, Innovaci\u00f3n y Universidades","ror":null},{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320332999","display_name":"Horizon 2020 Framework Programme","ror":"https://ror.org/00k4n6c32"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4220870389.pdf","grobid_xml":"https://content.openalex.org/works/W4220870389.grobid-xml"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W146900863","https://openalex.org/W1920845339","https://openalex.org/W1973867393","https://openalex.org/W2025365931","https://openalex.org/W2038043464","https://openalex.org/W2150731624","https://openalex.org/W2162317738","https://openalex.org/W2251463950","https://openalex.org/W2296760094","https://openalex.org/W2587676558","https://openalex.org/W2751976275","https://openalex.org/W2782303220","https://openalex.org/W2790855988","https://openalex.org/W2801930304","https://openalex.org/W2806298290","https://openalex.org/W2888241476","https://openalex.org/W2912176745","https://openalex.org/W2924920807","https://openalex.org/W2955389955","https://openalex.org/W2963459858","https://openalex.org/W2979907219","https://openalex.org/W2983594740","https://openalex.org/W2991320433","https://openalex.org/W3021751881","https://openalex.org/W3038847629","https://openalex.org/W3048633946","https://openalex.org/W3062383798","https://openalex.org/W3092336047","https://openalex.org/W3104077627","https://openalex.org/W3120784508","https://openalex.org/W4245803912","https://openalex.org/W6600313733","https://openalex.org/W6639619044"],"related_works":["https://openalex.org/W2769501189","https://openalex.org/W4315588616","https://openalex.org/W4312773271","https://openalex.org/W2761847515","https://openalex.org/W130869231","https://openalex.org/W2888805565","https://openalex.org/W2962686197","https://openalex.org/W4293734197","https://openalex.org/W4206967254","https://openalex.org/W2131689821"],"abstract_inverted_index":{"Abstract":[0],"Probabilistic":[1],"topic":[2,45,96,134,222,238],"modeling":[3],"algorithms":[4],"like":[5,66],"Latent":[6],"Dirichlet":[7],"Allocation":[8],"(LDA)":[9],"have":[10],"become":[11],"powerful":[12],"tools":[13],"for":[14,47,117,163,191],"the":[15,53,56,74,86,89,95,106,118,128,133,146,149,152,161,168,171,175,178,182,192,207,215,228,244],"analysis":[16,104,255],"of":[17,20,55,76,88,108,120,151,160,167,217,247,250],"large":[18],"collections":[19],"documents":[21],"(such":[22],"as":[23],"papers,":[24],"projects,":[25],"or":[26,68],"funding":[27],"applications)":[28],"in":[29,83,252],"science,":[30],"technology":[31],"an":[32,41],"innovation":[33],"(STI)":[34],"policy":[35,254],"design":[36],"and":[37,43,185,219,256],"monitoring.":[38],"However,":[39],"selecting":[40],"appropriate":[42],"stable":[44],"model":[46,97,184],"a":[48,60,80,114,164],"specific":[49],"application":[50],"(by":[51],"adjusting":[52],"hyperparameters":[54,121],"algorithm)":[57],"is":[58,98,111,123,204],"not":[59,79],"trivial":[61],"problem.":[62],"Common":[63],"validation":[64],"metrics":[65,130,209],"coherence":[67],"perplexity,":[69],"which":[70,122,232],"are":[71,78,225],"focused":[72],"on":[73,102,197],"quality":[75,87],"topics,":[77],"good":[81],"fit":[82],"applications":[84],"where":[85],"document":[90],"similarity":[91,129,153],"relations":[92],"inferred":[93],"from":[94,132,157,181],"especially":[99],"relevant.":[100],"Relying":[101],"graph":[103,144,179],"techniques,":[105],"aim":[107],"our":[109],"work":[110],"to":[112,126,138,201,213,236],"state":[113],"new":[115],"methodology":[116],"selection":[119],"specifically":[124],"oriented":[125],"optimize":[127],"emanating":[131],"model.":[135],"In":[136],"order":[137],"do":[139],"this,":[140],"we":[141],"propose":[142],"two":[143],"metrics:":[145],"first":[147],"measures":[148,174],"variability":[150],"graphs":[154],"that":[155,206,224],"result":[156],"different":[158],"runs":[159],"algorithm":[162],"fixed":[165],"value":[166],"hyperparameters,":[169],"while":[170],"second":[172],"metric":[173],"alignment":[176],"between":[177],"derived":[180],"LDA":[183],"another":[186],"obtained":[187],"using":[188],"metadata":[189],"available":[190],"corresponding":[193],"corpus.":[194],"Through":[195],"experiments":[196],"various":[198],"corpora":[199],"related":[200],"STI,":[202],"it":[203],"shown":[205],"proposed":[208],"provide":[210],"relevant":[211],"indicators":[212],"select":[214],"number":[216],"topics":[218],"build":[220],"persistent":[221],"models":[223,239],"consistent":[226],"with":[227],"metadata.":[229],"Their":[230],"use,":[231],"can":[233],"be":[234],"extended":[235],"other":[237],"beyond":[240],"LDA,":[241],"could":[242],"facilitate":[243],"systematic":[245],"adoption":[246],"this":[248],"kind":[249],"techniques":[251],"STI":[253],"design.":[257]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4}],"updated_date":"2026-06-22T08:00:12.763002","created_date":"2022-04-03T00:00:00"}
