{"id":"https://openalex.org/W1982230396","doi":"https://doi.org/10.1198/004017001316975925","title":"Clustering Massive Datasets With Application in Software Metrics and Tomography","display_name":"Clustering Massive Datasets With Application in Software Metrics and Tomography","publication_year":2001,"publication_date":"2001-08-01","ids":{"openalex":"https://openalex.org/W1982230396","doi":"https://doi.org/10.1198/004017001316975925","mag":"1982230396"},"language":"en","primary_location":{"id":"doi:10.1198/004017001316975925","is_oa":false,"landing_page_url":"https://doi.org/10.1198/004017001316975925","pdf_url":null,"source":{"id":"https://openalex.org/S985303","display_name":"Technometrics","issn_l":"0040-1706","issn":["0040-1706","1537-2723"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Technometrics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007920808","display_name":"Ranjan Maitra","orcid":"https://orcid.org/0000-0002-3515-8532"},"institutions":[{"id":"https://openalex.org/I79272384","display_name":"University of Maryland, Baltimore County","ror":"https://ror.org/02qskvh78","country_code":"US","type":"education","lineage":["https://openalex.org/I79272384"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ranjan Maitra","raw_affiliation_strings":["Department of Mathematics and Statistics, University of Maryland, Baltimore County, Baltimore MD 21250","\u00a0 University of Maryland, Baltimore County"],"affiliations":[{"raw_affiliation_string":"Department of Mathematics and Statistics, University of Maryland, Baltimore County, Baltimore MD 21250","institution_ids":["https://openalex.org/I79272384"]},{"raw_affiliation_string":"\u00a0 University of Maryland, Baltimore County","institution_ids":["https://openalex.org/I79272384"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5007920808"],"corresponding_institution_ids":["https://openalex.org/I79272384"],"apc_list":null,"apc_paid":null,"fwci":2.7277,"has_fulltext":false,"cited_by_count":34,"citation_normalized_percentile":{"value":0.90852286,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"43","issue":"3","first_page":"336","last_page":"346"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12205","display_name":"Time Series Analysis and Forecasting","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7286178469657898},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.705980658531189},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.6054357290267944},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.5828057527542114},{"id":"https://openalex.org/keywords/iterated-function","display_name":"Iterated function","score":0.5698227286338806},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.5381345152854919},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.45875075459480286},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.4458004832267761},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4432591497898102},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.42543575167655945},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3455360531806946},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32795703411102295},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3217094838619232},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.199832946062088},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.08220559358596802},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.05917426943778992}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7286178469657898},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.705980658531189},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6054357290267944},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.5828057527542114},{"id":"https://openalex.org/C140479938","wikidata":"https://www.wikidata.org/wiki/Q5254619","display_name":"Iterated function","level":2,"score":0.5698227286338806},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.5381345152854919},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.45875075459480286},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4458004832267761},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4432591497898102},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.42543575167655945},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3455360531806946},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32795703411102295},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3217094838619232},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.199832946062088},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.08220559358596802},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.05917426943778992},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1198/004017001316975925","is_oa":false,"landing_page_url":"https://doi.org/10.1198/004017001316975925","pdf_url":null,"source":{"id":"https://openalex.org/S985303","display_name":"Technometrics","issn_l":"0040-1706","issn":["0040-1706","1537-2723"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Technometrics","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320310207","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W109381222","https://openalex.org/W156509570","https://openalex.org/W632374264","https://openalex.org/W1508357192","https://openalex.org/W1553538755","https://openalex.org/W1975120776","https://openalex.org/W1992724796","https://openalex.org/W2001302965","https://openalex.org/W2002709772","https://openalex.org/W2005803955","https://openalex.org/W2010309065","https://openalex.org/W2013373485","https://openalex.org/W2028888440","https://openalex.org/W2033403400","https://openalex.org/W2050986127","https://openalex.org/W2051728439","https://openalex.org/W2053718475","https://openalex.org/W2064903690","https://openalex.org/W2068640436","https://openalex.org/W2071316194","https://openalex.org/W2077982583","https://openalex.org/W2082503527","https://openalex.org/W2082576445","https://openalex.org/W2085080020","https://openalex.org/W2085572798","https://openalex.org/W2086943813","https://openalex.org/W2090203522","https://openalex.org/W2097224648","https://openalex.org/W2125334673","https://openalex.org/W2133367958","https://openalex.org/W2325346015","https://openalex.org/W2333283264","https://openalex.org/W2612166593","https://openalex.org/W2801345297","https://openalex.org/W2913066018","https://openalex.org/W4237058027","https://openalex.org/W4242073520","https://openalex.org/W4244030505","https://openalex.org/W4246037734","https://openalex.org/W4390545247"],"related_works":["https://openalex.org/W3103325625","https://openalex.org/W1486898455","https://openalex.org/W3090727460","https://openalex.org/W2041905724","https://openalex.org/W2047986527","https://openalex.org/W4306313719","https://openalex.org/W3128682647","https://openalex.org/W2804364458","https://openalex.org/W2991463004","https://openalex.org/W4298130764"],"abstract_inverted_index":{"AbstractClustering":[0],"datasets":[1,76],"is":[2,12,95],"not":[3],"an":[4,28],"easy":[5],"problem":[6],"in":[7,64],"general,":[8],"and":[9,42,58,80],"the":[10,44,48,54,65,93],"difficulty":[11],"compounded":[13],"for":[14],"massive":[15],"datasets.":[16],"This":[17],"article":[18],"develops,":[19],"under":[20],"Gaussian":[21,101],"assumptions,":[22],"a":[23],"multistage":[24],"algorithm":[25],"that":[26,34,92],"clusters":[27],"initial":[29],"sample,":[30],"filters":[31],"out":[32],"observations":[33],"can":[35],"be":[36],"reasonably":[37],"classified":[38],"by":[39],"these":[40],"clusters,":[41],"iterates":[43],"preceding":[45],"procedure":[46,94],"on":[47,68],"remainder.":[49],"A":[50],"final":[51],"step":[52],"uses":[53],"estimated":[55],"class":[56],"probabilities":[57],"dispersions":[59],"to":[60,75,97],"classify":[61],"each":[62],"observation":[63],"dataset.":[66],"Results":[67],"test":[69],"experiments":[70],"indicate":[71],"good":[72],"performance.":[73],"Application":[74],"from":[77],"software":[78],"metrics":[79],"positron":[81],"emission":[82],"tomography":[83],"required":[84],"no":[85],"more":[86],"than":[87],"five":[88],"stages":[89],"each,":[90],"suggesting":[91],"practical":[96],"implement.KEY":[98],"WORDS":[99],":":[100],"distributionLikelihood":[102],"ratio":[103],"testMultistage":[104],"procedureSample":[105]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
