{"id":"https://openalex.org/W2094324273","doi":"https://doi.org/10.1109/grc.2005.1547264","title":"Semantic based clustering of Web documents","display_name":"Semantic based clustering of Web documents","publication_year":2005,"publication_date":"2005-01-01","ids":{"openalex":"https://openalex.org/W2094324273","doi":"https://doi.org/10.1109/grc.2005.1547264","mag":"2094324273"},"language":"en","primary_location":{"id":"doi:10.1109/grc.2005.1547264","is_oa":false,"landing_page_url":"https://doi.org/10.1109/grc.2005.1547264","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2005 IEEE International Conference on Granular Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065383216","display_name":"T. Lin","orcid":"https://orcid.org/0009-0000-7432-0718"},"institutions":[{"id":"https://openalex.org/I51504820","display_name":"San Jose State University","ror":"https://ror.org/04qyvz380","country_code":"US","type":"education","lineage":["https://openalex.org/I51504820"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"T.Y. Lin","raw_affiliation_strings":["Department of Computer Science, San Jose State University Foundation, USA","Department of Computer Science, San Jose State Univ., CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, San Jose State University Foundation, USA","institution_ids":["https://openalex.org/I51504820"]},{"raw_affiliation_string":"Department of Computer Science, San Jose State Univ., CA, USA","institution_ids":["https://openalex.org/I51504820"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110147547","display_name":"I\u2010Jen Chiang","orcid":null},"institutions":[{"id":"https://openalex.org/I47519274","display_name":"Taipei Medical University","ror":"https://ror.org/05031qk94","country_code":"TW","type":"education","lineage":["https://openalex.org/I47519274"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"I-Jen Chiang","raw_affiliation_strings":["Graduate Institute of Medical Informatics, Taipei Medical University, Taiwan","Taipei Medical University"],"affiliations":[{"raw_affiliation_string":"Graduate Institute of Medical Informatics, Taipei Medical University, Taiwan","institution_ids":["https://openalex.org/I47519274"]},{"raw_affiliation_string":"Taipei Medical University","institution_ids":["https://openalex.org/I47519274"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5065383216"],"corresponding_institution_ids":["https://openalex.org/I51504820"],"apc_list":null,"apc_paid":null,"fwci":0.3179,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.57367159,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"26","issue":null,"first_page":"189","last_page":"192 Vol. 1"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7788839340209961},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7645617723464966},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.6258477568626404},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6183853149414062},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.44805359840393066},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.42936769127845764},{"id":"https://openalex.org/keywords/conceptual-clustering","display_name":"Conceptual clustering","score":0.42108261585235596},{"id":"https://openalex.org/keywords/brown-clustering","display_name":"Brown clustering","score":0.41524872183799744},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.41495534777641296},{"id":"https://openalex.org/keywords/fuzzy-clustering","display_name":"Fuzzy clustering","score":0.344552218914032},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3246244192123413},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32111313939094543},{"id":"https://openalex.org/keywords/canopy-clustering-algorithm","display_name":"Canopy clustering algorithm","score":0.24196696281433105},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14176839590072632},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1109113097190857},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.06965842843055725}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7788839340209961},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7645617723464966},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.6258477568626404},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6183853149414062},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.44805359840393066},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.42936769127845764},{"id":"https://openalex.org/C39235581","wikidata":"https://www.wikidata.org/wiki/Q5158434","display_name":"Conceptual clustering","level":5,"score":0.42108261585235596},{"id":"https://openalex.org/C167984511","wikidata":"https://www.wikidata.org/wiki/Q17003931","display_name":"Brown clustering","level":5,"score":0.41524872183799744},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.41495534777641296},{"id":"https://openalex.org/C17212007","wikidata":"https://www.wikidata.org/wiki/Q5511111","display_name":"Fuzzy clustering","level":3,"score":0.344552218914032},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3246244192123413},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32111313939094543},{"id":"https://openalex.org/C104047586","wikidata":"https://www.wikidata.org/wiki/Q5033439","display_name":"Canopy clustering algorithm","level":4,"score":0.24196696281433105},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14176839590072632},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1109113097190857},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.06965842843055725},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/grc.2005.1547264","is_oa":false,"landing_page_url":"https://doi.org/10.1109/grc.2005.1547264","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2005 IEEE International Conference on Granular Computing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W110443600","https://openalex.org/W1484413656","https://openalex.org/W1490467896","https://openalex.org/W1507051419","https://openalex.org/W1524704912","https://openalex.org/W1543250017","https://openalex.org/W1546274087","https://openalex.org/W1548802052","https://openalex.org/W1601717103","https://openalex.org/W1663435917","https://openalex.org/W1918870341","https://openalex.org/W1956559956","https://openalex.org/W1971784203","https://openalex.org/W1978394996","https://openalex.org/W1989993068","https://openalex.org/W1995872006","https://openalex.org/W1996764654","https://openalex.org/W1997841190","https://openalex.org/W2010652031","https://openalex.org/W2037965136","https://openalex.org/W2054119298","https://openalex.org/W2054624705","https://openalex.org/W2066636486","https://openalex.org/W2080301338","https://openalex.org/W2081980673","https://openalex.org/W2082729696","https://openalex.org/W2095150974","https://openalex.org/W2100958137","https://openalex.org/W2118020653","https://openalex.org/W2120970098","https://openalex.org/W2127218421","https://openalex.org/W2129530648","https://openalex.org/W2138656431","https://openalex.org/W2144212226","https://openalex.org/W2144481322","https://openalex.org/W2149892594","https://openalex.org/W2153028052","https://openalex.org/W2154638710","https://openalex.org/W2160368903","https://openalex.org/W2166559705","https://openalex.org/W2325227998","https://openalex.org/W2474187693","https://openalex.org/W2500846359","https://openalex.org/W6628750762","https://openalex.org/W6629265943","https://openalex.org/W6632472715","https://openalex.org/W6635896488","https://openalex.org/W6637089771","https://openalex.org/W6680662060","https://openalex.org/W6681242987"],"related_works":["https://openalex.org/W4231226332","https://openalex.org/W2043128599","https://openalex.org/W2530779535","https://openalex.org/W3037575264","https://openalex.org/W4256662921","https://openalex.org/W2519801912","https://openalex.org/W2182337998","https://openalex.org/W3140018618","https://openalex.org/W2299731084","https://openalex.org/W3085911097"],"abstract_inverted_index":{"A":[0],"new":[1],"methodology":[2],"that":[3,64],"structures":[4],"the":[5,13,65,92,96],"semantics":[6,94],"of":[7,10,15,95],"a":[8,16,21,27,32,36],"collection":[9],"documents":[11,42],"into":[12,46],"geometry":[14],"simplicial":[17],"complex":[18],"is":[19,24],"developed:":[20],"primitive":[22],"concept":[23],"represented":[25],"by":[26],"top":[28],"dimension":[29],"simplex,":[30],"and":[31,59,81],"connected":[33],"component":[34],"represents":[35],"concept.":[37],"Based":[38],"on":[39],"these":[40],"structures,":[41],"can":[43],"be":[44],"clustered":[45],"some":[47],"meaningful":[48],"classes.":[49],"Experiments":[50],"with":[51],"three":[52],"different":[53],"data":[54],"sets":[55],"from":[56],"web":[57],"pages":[58],"medical":[60],"literature":[61],"have":[62,90],"shown":[63],"proposed":[66],"unsupervised":[67],"clustering":[68,75,83],"approach":[69],"performs":[70],"significantly":[71],"better":[72],"than":[73],"traditional":[74],"algorithms,":[76],"such":[77],"as":[78],"k-means,":[79],"AutoClass":[80],"hierarchical":[82],"(HAC).":[84],"This":[85],"abstract":[86],"geometric":[87],"model":[88],"seems":[89],"captured":[91],"intrinsic":[93],"documents.":[97]},"counts_by_year":[{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
