{"id":"https://openalex.org/W4387885660","doi":"https://doi.org/10.1109/tvcg.2023.3326569","title":"Large-Scale Evaluation of Topic Models and Dimensionality Reduction Methods for 2D Text Spatialization","display_name":"Large-Scale Evaluation of Topic Models and Dimensionality Reduction Methods for 2D Text Spatialization","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4387885660","doi":"https://doi.org/10.1109/tvcg.2023.3326569","pmid":"https://pubmed.ncbi.nlm.nih.gov/37871085"},"language":"en","primary_location":{"id":"doi:10.1109/tvcg.2023.3326569","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvcg.2023.3326569","pdf_url":null,"source":{"id":"https://openalex.org/S84775595","display_name":"IEEE Transactions on Visualization and Computer Graphics","issn_l":"1077-2626","issn":["1077-2626","1941-0506","2160-9306"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Visualization and Computer Graphics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056962479","display_name":"Daniel Atzberger","orcid":null},"institutions":[{"id":"https://openalex.org/I176453806","display_name":"University of Potsdam","ror":"https://ror.org/03bnmw459","country_code":"DE","type":"education","lineage":["https://openalex.org/I176453806"]},{"id":"https://openalex.org/I143288331","display_name":"Hasso Plattner Institute","ror":"https://ror.org/058rn5r42","country_code":"DE","type":"facility","lineage":["https://openalex.org/I143288331","https://openalex.org/I176453806"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Daniel Atzberger","raw_affiliation_strings":["Digital Engineering Faculty, Hasso Plattner Institute, University of Potsdam, Germany"],"affiliations":[{"raw_affiliation_string":"Digital Engineering Faculty, Hasso Plattner Institute, University of Potsdam, Germany","institution_ids":["https://openalex.org/I143288331","https://openalex.org/I176453806"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008071697","display_name":"Tim Cech","orcid":"https://orcid.org/0000-0001-8688-2419"},"institutions":[{"id":"https://openalex.org/I176453806","display_name":"University of Potsdam","ror":"https://ror.org/03bnmw459","country_code":"DE","type":"education","lineage":["https://openalex.org/I176453806"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Tim Cech","raw_affiliation_strings":["Digital Engineering Faculty, University of Potsdam, Germany"],"affiliations":[{"raw_affiliation_string":"Digital Engineering Faculty, University of Potsdam, Germany","institution_ids":["https://openalex.org/I176453806"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090346908","display_name":"Matthias Trapp","orcid":"https://orcid.org/0000-0003-3861-5759"},"institutions":[{"id":"https://openalex.org/I176453806","display_name":"University of Potsdam","ror":"https://ror.org/03bnmw459","country_code":"DE","type":"education","lineage":["https://openalex.org/I176453806"]},{"id":"https://openalex.org/I143288331","display_name":"Hasso Plattner Institute","ror":"https://ror.org/058rn5r42","country_code":"DE","type":"facility","lineage":["https://openalex.org/I143288331","https://openalex.org/I176453806"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Matthias Trapp","raw_affiliation_strings":["Digital Engineering Faculty, Hasso Plattner Institute, University of Potsdam, Germany"],"affiliations":[{"raw_affiliation_string":"Digital Engineering Faculty, Hasso Plattner Institute, University of Potsdam, Germany","institution_ids":["https://openalex.org/I143288331","https://openalex.org/I176453806"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035885351","display_name":"Rico Richter","orcid":"https://orcid.org/0000-0001-5523-3694"},"institutions":[{"id":"https://openalex.org/I176453806","display_name":"University of Potsdam","ror":"https://ror.org/03bnmw459","country_code":"DE","type":"education","lineage":["https://openalex.org/I176453806"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Rico Richter","raw_affiliation_strings":["Digital Engineering Faculty, University of Potsdam, Germany"],"affiliations":[{"raw_affiliation_string":"Digital Engineering Faculty, University of Potsdam, Germany","institution_ids":["https://openalex.org/I176453806"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052710697","display_name":"Willy Scheibel","orcid":"https://orcid.org/0000-0002-7885-9857"},"institutions":[{"id":"https://openalex.org/I143288331","display_name":"Hasso Plattner Institute","ror":"https://ror.org/058rn5r42","country_code":"DE","type":"facility","lineage":["https://openalex.org/I143288331","https://openalex.org/I176453806"]},{"id":"https://openalex.org/I176453806","display_name":"University of Potsdam","ror":"https://ror.org/03bnmw459","country_code":"DE","type":"education","lineage":["https://openalex.org/I176453806"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Willy Scheibel","raw_affiliation_strings":["Digital Engineering Faculty, Hasso Plattner Institute, University of Potsdam, Germany"],"affiliations":[{"raw_affiliation_string":"Digital Engineering Faculty, Hasso Plattner Institute, University of Potsdam, Germany","institution_ids":["https://openalex.org/I143288331","https://openalex.org/I176453806"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081246092","display_name":"J\u00fcrgen D\u00f6llner","orcid":null},"institutions":[{"id":"https://openalex.org/I176453806","display_name":"University of Potsdam","ror":"https://ror.org/03bnmw459","country_code":"DE","type":"education","lineage":["https://openalex.org/I176453806"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jurgen D\u00f6llner","raw_affiliation_strings":["Digital Engineering Faculty, University of Potsdam, Germany"],"affiliations":[{"raw_affiliation_string":"Digital Engineering Faculty, University of Potsdam, Germany","institution_ids":["https://openalex.org/I176453806"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016219620","display_name":"Tobias Schreck","orcid":"https://orcid.org/0000-0003-0778-8665"},"institutions":[{"id":"https://openalex.org/I4092182","display_name":"Graz University of Technology","ror":"https://ror.org/00d7xrm67","country_code":"AT","type":"education","lineage":["https://openalex.org/I4092182"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Tobias Schreck","raw_affiliation_strings":["Graz University of Technology, Austria"],"affiliations":[{"raw_affiliation_string":"Graz University of Technology, Austria","institution_ids":["https://openalex.org/I4092182"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5056962479"],"corresponding_institution_ids":["https://openalex.org/I143288331","https://openalex.org/I176453806"],"apc_list":null,"apc_paid":null,"fwci":1.219,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.81856915,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"30","issue":"1","first_page":"1","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9866999983787537,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8042201995849609},{"id":"https://openalex.org/keywords/dimensionality-reduction","display_name":"Dimensionality reduction","score":0.7064290046691895},{"id":"https://openalex.org/keywords/spatialization","display_name":"Spatialization","score":0.5932772159576416},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.5816372632980347},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.576852560043335},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5682401061058044},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.5239591598510742},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5118665099143982},{"id":"https://openalex.org/keywords/text-corpus","display_name":"Text corpus","score":0.4506509602069855},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.43660280108451843},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.42679840326309204},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3412795066833496},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3306256830692291}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8042201995849609},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.7064290046691895},{"id":"https://openalex.org/C2777031145","wikidata":"https://www.wikidata.org/wiki/Q4430987","display_name":"Spatialization","level":2,"score":0.5932772159576416},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.5816372632980347},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.576852560043335},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5682401061058044},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.5239591598510742},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5118665099143982},{"id":"https://openalex.org/C2474386","wikidata":"https://www.wikidata.org/wiki/Q461183","display_name":"Text corpus","level":2,"score":0.4506509602069855},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.43660280108451843},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.42679840326309204},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3412795066833496},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3306256830692291},{"id":"https://openalex.org/C19165224","wikidata":"https://www.wikidata.org/wiki/Q23404","display_name":"Anthropology","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tvcg.2023.3326569","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvcg.2023.3326569","pdf_url":null,"source":{"id":"https://openalex.org/S84775595","display_name":"IEEE Transactions on Visualization and Computer Graphics","issn_l":"1077-2626","issn":["1077-2626","1941-0506","2160-9306"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Visualization and Computer Graphics","raw_type":"journal-article"},{"id":"pmid:37871085","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37871085","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on visualization and computer graphics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":82,"referenced_works":["https://openalex.org/W40976687","https://openalex.org/W1571401318","https://openalex.org/W1596936080","https://openalex.org/W1826790618","https://openalex.org/W1902027874","https://openalex.org/W1927933524","https://openalex.org/W1928219753","https://openalex.org/W1951518548","https://openalex.org/W1987971958","https://openalex.org/W1990995255","https://openalex.org/W2001542951","https://openalex.org/W2012521459","https://openalex.org/W2015755066","https://openalex.org/W2038043464","https://openalex.org/W2051224630","https://openalex.org/W2051767208","https://openalex.org/W2078526387","https://openalex.org/W2085487226","https://openalex.org/W2086461919","https://openalex.org/W2087382273","https://openalex.org/W2104766360","https://openalex.org/W2115891846","https://openalex.org/W2119452648","https://openalex.org/W2128554541","https://openalex.org/W2133205243","https://openalex.org/W2136435231","https://openalex.org/W2137570937","https://openalex.org/W2147152072","https://openalex.org/W2160170318","https://openalex.org/W2162825485","https://openalex.org/W2164961799","https://openalex.org/W2184914077","https://openalex.org/W2187089797","https://openalex.org/W2187358498","https://openalex.org/W2218641061","https://openalex.org/W2238545866","https://openalex.org/W2395911969","https://openalex.org/W2512177572","https://openalex.org/W2610962473","https://openalex.org/W2786672974","https://openalex.org/W2797565035","https://openalex.org/W2807795618","https://openalex.org/W2815307792","https://openalex.org/W2887683504","https://openalex.org/W2943857514","https://openalex.org/W2947771069","https://openalex.org/W2966135715","https://openalex.org/W2975605169","https://openalex.org/W3027472289","https://openalex.org/W3042697744","https://openalex.org/W3042939456","https://openalex.org/W3046717556","https://openalex.org/W3048251905","https://openalex.org/W3094279873","https://openalex.org/W3099514962","https://openalex.org/W3131125794","https://openalex.org/W3138819813","https://openalex.org/W3176479810","https://openalex.org/W3177269615","https://openalex.org/W3184973310","https://openalex.org/W3204809439","https://openalex.org/W4212827234","https://openalex.org/W4239908238","https://openalex.org/W4245882257","https://openalex.org/W4254491045","https://openalex.org/W4297461125","https://openalex.org/W4297461362","https://openalex.org/W4297817021","https://openalex.org/W4300113520","https://openalex.org/W4312686527","https://openalex.org/W4315836531","https://openalex.org/W6601161491","https://openalex.org/W6675301171","https://openalex.org/W6686785280","https://openalex.org/W6697071071","https://openalex.org/W6748816842","https://openalex.org/W6755207826","https://openalex.org/W6762996673","https://openalex.org/W6766471253","https://openalex.org/W6780486361","https://openalex.org/W6782149786","https://openalex.org/W6853824374"],"related_works":["https://openalex.org/W1995622179","https://openalex.org/W1484111231","https://openalex.org/W1552543208","https://openalex.org/W2074396517","https://openalex.org/W2166963679","https://openalex.org/W2187269125","https://openalex.org/W1641615907","https://openalex.org/W3089231081","https://openalex.org/W2093956241","https://openalex.org/W2354420595"],"abstract_inverted_index":{"Topic":[0],"models":[1,26,92,138,229,242],"are":[2,134,153,225,243],"a":[3,15,20,113,123,128,164,192,197,234,260],"class":[4],"of":[5,53,90,100,121,125,130,136,173,182,221,249,257],"unsupervised":[6],"learning":[7],"algorithms":[8,132],"for":[9,30,33,97,108,146,217,245],"detecting":[10],"the":[11,44,51,54,57,66,88,98,148,171,179,183,189,212,218,247,255],"semantic":[12,41],"structure":[13,248],"within":[14],"text":[16,34,222,250],"corpus.":[17],"Together":[18],"with":[19,79,200],"subsequent":[21,261],"dimensionality":[22,58,94,140,231,262],"reduction":[23,95],"algorithm,":[24],"topic":[25,55,91,137,228,241],"can":[27],"be":[28],"used":[29],"deriving":[31],"spatializations":[32,223],"corpora":[35,101,152],"as":[36,102,155,259],"two-dimensional":[37,103,184],"scatter":[38,104,185],"plots,":[39],"reflecting":[40],"similarity":[42],"between":[43],"documents":[45],"and":[46,60,83,93,139,142,158,175,178,206,230],"supporting":[47],"corpus":[48],"analysis.":[49],"Although":[50],"choice":[52],"model,":[56],"reduction,":[59],"their":[61],"underlying":[62],"hyperparameters":[63],"significantly":[64],"impact":[65],"resulting":[67,149],"layout,":[68],"it":[69],"is":[70,161],"unknown":[71],"which":[72],"particular":[73],"combinations":[74,135],"result":[75],"in":[76],"high-quality":[77],"layouts":[78,205],"respect":[80],"to":[81,163],"accuracy":[82],"perception":[84],"metrics.":[85,209],"To":[86],"investigate":[87],"effectiveness":[89,181],"methods":[96],"spatialization":[99],"plots":[105],"(or":[106],"basis":[107],"landscape-type":[109],"visualizations),":[110],"we":[111,195,214,237],"present":[112],"large-scale,":[114],"benchmark-based":[115],"computational":[116],"evaluation.":[117],"Our":[118],"evaluation":[119],"consists":[120],"(1)":[122],"set":[124,129],"corpora,":[126],"(2)":[127],"layout":[131],"that":[133,224,239],"reductions,":[141],"(3)":[143],"quality":[144,208],"metrics":[145,169],"quantifying":[147],"layout.":[150],"The":[151,167],"given":[154],"document-term":[156],"matrices,":[157],"each":[159],"document":[160],"assigned":[162],"thematic":[165],"class.":[166],"chosen":[168],"quantify":[170],"preservation":[172],"local":[174],"global":[176],"properties":[177],"perceptual":[180],"plots.":[186],"By":[187],"evaluating":[188],"benchmark":[190],"on":[191,211,227],"computing":[193],"cluster,":[194],"derived":[196],"multivariate":[198],"dataset":[199],"over":[201],"45":[202],"000":[203],"individual":[204],"corresponding":[207],"Based":[210],"results,":[213],"propose":[215],"guidelines":[216],"effective":[219],"design":[220],"based":[226],"reductions.":[232],"As":[233],"main":[235],"result,":[236],"show":[238],"interpretable":[240],"beneficial":[244],"capturing":[246],"corpora.":[251],"We":[252],"furthermore":[253],"recommend":[254],"use":[256],"t-SNE":[258],"reduction.":[263]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":5}],"updated_date":"2026-03-17T09:09:15.849793","created_date":"2025-10-10T00:00:00"}
