{"id":"https://openalex.org/W4414878502","doi":"https://doi.org/10.48550/arxiv.2507.17174","title":"GhostUMAP2: Measuring and Analyzing (r,d)-Stability of UMAP","display_name":"GhostUMAP2: Measuring and Analyzing (r,d)-Stability of UMAP","publication_year":2025,"publication_date":"2025-07-23","ids":{"openalex":"https://openalex.org/W4414878502","doi":"https://doi.org/10.48550/arxiv.2507.17174"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2507.17174","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.17174","pdf_url":"https://arxiv.org/pdf/2507.17174","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2507.17174","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102594980","display_name":"Myeongwon Jung","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jung, Myeongwon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Fujiwara, Takanori","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fujiwara, Takanori","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5102959274","display_name":"Jaemin Jo","orcid":"https://orcid.org/0000-0002-5207-6010"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jo, Jaemin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10138","display_name":"Network Traffic and Congestion Control","score":0.9840999841690063,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10138","display_name":"Network Traffic and Congestion Control","score":0.9840999841690063,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11158","display_name":"Wireless Networks and Protocols","score":0.9588000178337097,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12203","display_name":"Mobile Agent-Based Network Management","score":0.9585999846458435,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/projection","display_name":"Projection (relational algebra)","score":0.7736999988555908},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.5364000201225281},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.49239999055862427},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4593000113964081},{"id":"https://openalex.org/keywords/data-point","display_name":"Data point","score":0.4034999907016754},{"id":"https://openalex.org/keywords/stochastic-process","display_name":"Stochastic process","score":0.40230000019073486},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.3853999972343445},{"id":"https://openalex.org/keywords/data-visualization","display_name":"Data visualization","score":0.3833000063896179}],"concepts":[{"id":"https://openalex.org/C57493831","wikidata":"https://www.wikidata.org/wiki/Q3134666","display_name":"Projection (relational algebra)","level":2,"score":0.7736999988555908},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5823000073432922},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.5364000201225281},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.49239999055862427},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4593000113964081},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.447299987077713},{"id":"https://openalex.org/C21080849","wikidata":"https://www.wikidata.org/wiki/Q13611879","display_name":"Data point","level":2,"score":0.4034999907016754},{"id":"https://openalex.org/C8272713","wikidata":"https://www.wikidata.org/wiki/Q176737","display_name":"Stochastic process","level":2,"score":0.40230000019073486},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.3853999972343445},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.3833000063896179},{"id":"https://openalex.org/C529865628","wikidata":"https://www.wikidata.org/wiki/Q1790740","display_name":"Manifold (fluid mechanics)","level":2,"score":0.3547999858856201},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3481000065803528},{"id":"https://openalex.org/C178635117","wikidata":"https://www.wikidata.org/wiki/Q747499","display_name":"RADIUS","level":2,"score":0.34630000591278076},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3131999969482422},{"id":"https://openalex.org/C176250725","wikidata":"https://www.wikidata.org/wiki/Q186386","display_name":"Map projection","level":2,"score":0.3082999885082245},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.30489999055862427},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.2906999886035919},{"id":"https://openalex.org/C151876577","wikidata":"https://www.wikidata.org/wiki/Q7049464","display_name":"Nonlinear dimensionality reduction","level":3,"score":0.29030001163482666},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.28220000863075256},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.28139999508857727},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2791000008583069},{"id":"https://openalex.org/C65557600","wikidata":"https://www.wikidata.org/wiki/Q7249451","display_name":"Projection method","level":3,"score":0.27720001339912415},{"id":"https://openalex.org/C127491075","wikidata":"https://www.wikidata.org/wiki/Q7617825","display_name":"Stochastic modelling","level":2,"score":0.2671000063419342},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2531000077724457},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.25200000405311584}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2507.17174","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.17174","pdf_url":"https://arxiv.org/pdf/2507.17174","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2507.17174","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.17174","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2507.17174","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.17174","pdf_url":"https://arxiv.org/pdf/2507.17174","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Despite":[0],"the":[1,11,19,32,60,67,119,137,173,177,185,192,204],"widespread":[2],"use":[3,206],"of":[4,13,34,63,90,115,127,162,176,179,187,194,196,207],"Uniform":[5],"Manifold":[6],"Approximation":[7],"and":[8,79,199],"Projection":[9],"(UMAP),":[10],"impact":[12,82],"its":[14,109],"stochastic":[15,61,73],"optimization":[16],"process":[17],"on":[18],"results":[20,30],"remains":[21],"underexplored.":[22],"We":[23,100,165],"observed":[24],"that":[25,58,146,171],"it":[26],"often":[27],"produces":[28],"unstable":[29,163],"where":[31],"projections":[33,195],"data":[35,64,91,103,180],"points":[36,65,92],"are":[37],"determined":[38],"mostly":[39],"by":[40,190],"chance":[41],"rather":[42],"than":[43],"reflecting":[44],"neighboring":[45],"structures.":[46],"To":[47,70,134],"address":[48],"this":[49],"limitation,":[50],"we":[51,85,140,183],"introduce":[52,86],"(r,d)-stability":[53,178],"to":[54,98,151,154],"UMAP:":[55],"a":[56,102,113,125,148,168],"framework":[57,189],"analyzes":[59],"positioning":[62],"in":[66,118],"projection":[68,77,105,121],"space.":[69],"assess":[71],"how":[72],"elements,":[74],"specifically":[75],"initial":[76,120],"positions":[78],"negative":[80],"sampling,":[81],"UMAP":[83],"results,":[84],"\"ghosts\",":[87],"or":[88],"duplicates":[89],"representing":[93],"potential":[94],"positional":[95],"variations":[96],"due":[97],"stochasticity.":[99],"define":[101],"point's":[104],"as":[106],"(r,d)-stable":[107],"if":[108],"ghosts":[110],"perturbed":[111],"within":[112,124],"circle":[114,126],"radius":[116,128],"r":[117],"remain":[122],"confined":[123],"d":[129],"for":[130,203],"their":[131],"final":[132],"positions.":[133],"efficiently":[135],"compute":[136],"ghost":[138],"projections,":[139],"develop":[141],"an":[142,155],"adaptive":[143],"dropping":[144],"scheme":[145],"reduces":[147],"runtime":[149],"up":[150],"60%":[152],"compared":[153],"unoptimized":[156],"baseline":[157],"while":[158],"maintaining":[159],"approximately":[160],"90%":[161],"points.":[164,181],"also":[166],"present":[167,200],"visualization":[169],"tool":[170],"supports":[172],"interactive":[174],"exploration":[175],"Finally,":[182],"demonstrate":[184],"effectiveness":[186],"our":[188,208],"examining":[191],"stability":[193],"real-world":[197],"datasets":[198],"usage":[201],"guidelines":[202],"effective":[205],"framework.":[209]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
