{"id":"https://openalex.org/W2145030516","doi":"https://doi.org/10.1007/978-3-540-74628-7_22","title":"On the Relative Hardness of Clustering Corpora","display_name":"On the Relative Hardness of Clustering Corpora","publication_year":2007,"publication_date":"2007-08-18","ids":{"openalex":"https://openalex.org/W2145030516","doi":"https://doi.org/10.1007/978-3-540-74628-7_22","mag":"2145030516"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-540-74628-7_22","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-540-74628-7_22","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016612157","display_name":"David Pinto","orcid":"https://orcid.org/0000-0002-8516-5925"},"institutions":[{"id":"https://openalex.org/I60053951","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859","country_code":"ES","type":"education","lineage":["https://openalex.org/I60053951"]},{"id":"https://openalex.org/I721619","display_name":"Benem\u00e9rita Universidad Aut\u00f3noma de Puebla","ror":"https://ror.org/03p2z7827","country_code":"MX","type":"education","lineage":["https://openalex.org/I721619"]}],"countries":["ES","MX"],"is_corresponding":false,"raw_author_name":"David Pinto","raw_affiliation_strings":["B. Autonomous University of Puebla, Mexico","Department of Information Systems and Computation, Polytechnic University of Valencia, Spain, Faculty of Computer Science, \u00a0","Department of Information Systems and Computation, Polytechnic University of Valencia, Spain, Faculty of Computer Science,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"B. Autonomous University of Puebla, Mexico","institution_ids":["https://openalex.org/I721619"]},{"raw_affiliation_string":"Department of Information Systems and Computation, Polytechnic University of Valencia, Spain, Faculty of Computer Science, \u00a0","institution_ids":["https://openalex.org/I60053951"]},{"raw_affiliation_string":"Department of Information Systems and Computation, Polytechnic University of Valencia, Spain, Faculty of Computer Science,","institution_ids":["https://openalex.org/I60053951"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053947754","display_name":"Paolo Rosso","orcid":"https://orcid.org/0000-0002-8922-1242"},"institutions":[{"id":"https://openalex.org/I60053951","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859","country_code":"ES","type":"education","lineage":["https://openalex.org/I60053951"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Paolo Rosso","raw_affiliation_strings":["Department of Information Systems and Computation, Polytechnic University of Valencia, Spain, Faculty of Computer Science, \u00a0","Department of Information Systems and Computation, Polytechnic University of Valencia, Spain, Faculty of Computer Science,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Systems and Computation, Polytechnic University of Valencia, Spain, Faculty of Computer Science, \u00a0","institution_ids":["https://openalex.org/I60053951"]},{"raw_affiliation_string":"Department of Information Systems and Computation, Polytechnic University of Valencia, Spain, Faculty of Computer Science,","institution_ids":["https://openalex.org/I60053951"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":2.9711,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.92700039,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"155","last_page":"161"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.89640212059021},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6292725801467896},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5915695428848267},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5766239166259766},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5290882587432861},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5107057690620422},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5026683807373047},{"id":"https://openalex.org/keywords/conceptual-clustering","display_name":"Conceptual clustering","score":0.470491886138916},{"id":"https://openalex.org/keywords/document-clustering","display_name":"Document clustering","score":0.4288294315338135},{"id":"https://openalex.org/keywords/brown-clustering","display_name":"Brown clustering","score":0.42500197887420654},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.408785343170166},{"id":"https://openalex.org/keywords/correlation-clustering","display_name":"Correlation clustering","score":0.31410643458366394},{"id":"https://openalex.org/keywords/cure-data-clustering-algorithm","display_name":"CURE data clustering algorithm","score":0.31320926547050476},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.08343252539634705},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.060770004987716675},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.050034910440444946}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.89640212059021},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6292725801467896},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5915695428848267},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5766239166259766},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5290882587432861},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5107057690620422},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5026683807373047},{"id":"https://openalex.org/C39235581","wikidata":"https://www.wikidata.org/wiki/Q5158434","display_name":"Conceptual clustering","level":5,"score":0.470491886138916},{"id":"https://openalex.org/C177937566","wikidata":"https://www.wikidata.org/wiki/Q4223102","display_name":"Document clustering","level":3,"score":0.4288294315338135},{"id":"https://openalex.org/C167984511","wikidata":"https://www.wikidata.org/wiki/Q17003931","display_name":"Brown clustering","level":5,"score":0.42500197887420654},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.408785343170166},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.31410643458366394},{"id":"https://openalex.org/C33704608","wikidata":"https://www.wikidata.org/wiki/Q5014717","display_name":"CURE data clustering algorithm","level":4,"score":0.31320926547050476},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.08343252539634705},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.060770004987716675},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.050034910440444946},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-3-540-74628-7_22","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-540-74628-7_22","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W133449889","https://openalex.org/W1501099340","https://openalex.org/W1519573080","https://openalex.org/W1580638181","https://openalex.org/W1588215433","https://openalex.org/W1651266083","https://openalex.org/W1836741323","https://openalex.org/W1911857613","https://openalex.org/W2034986427","https://openalex.org/W2100074460"],"related_works":["https://openalex.org/W2622412490","https://openalex.org/W1957537378","https://openalex.org/W2160785859","https://openalex.org/W2087424554","https://openalex.org/W2101637161","https://openalex.org/W2385630304","https://openalex.org/W3140018618","https://openalex.org/W2607137685","https://openalex.org/W3168918549","https://openalex.org/W2049890817"],"abstract_inverted_index":null,"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
