{"id":"https://openalex.org/W2057870902","doi":"https://doi.org/10.1145/1458082.1458105","title":"An empirical study of required dimensionality for large-scale latent semantic indexing applications","display_name":"An empirical study of required dimensionality for large-scale latent semantic indexing applications","publication_year":2008,"publication_date":"2008-10-26","ids":{"openalex":"https://openalex.org/W2057870902","doi":"https://doi.org/10.1145/1458082.1458105","mag":"2057870902"},"language":"en","primary_location":{"id":"doi:10.1145/1458082.1458105","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1458082.1458105","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th ACM conference on Information and knowledge management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088893823","display_name":"Roger Bradford","orcid":"https://orcid.org/0000-0003-1750-3125"},"institutions":[{"id":"https://openalex.org/I138285227","display_name":"Agilent Technologies (United States)","ror":"https://ror.org/02tryst02","country_code":"US","type":"company","lineage":["https://openalex.org/I138285227"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Roger B. Bradford","raw_affiliation_strings":["Agilex Technologies, Chantilly, VA, USA"],"affiliations":[{"raw_affiliation_string":"Agilex Technologies, Chantilly, VA, USA","institution_ids":["https://openalex.org/I138285227"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5088893823"],"corresponding_institution_ids":["https://openalex.org/I138285227"],"apc_list":null,"apc_paid":null,"fwci":11.2036,"has_fulltext":false,"cited_by_count":142,"citation_normalized_percentile":{"value":0.98222429,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"153","last_page":"162"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7572758793830872},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.7384740710258484},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.720963180065155},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.535027027130127},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5208666324615479},{"id":"https://openalex.org/keywords/probabilistic-latent-semantic-analysis","display_name":"Probabilistic latent semantic analysis","score":0.5111966729164124},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.48733219504356384},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.45979899168014526},{"id":"https://openalex.org/keywords/singular-value-decomposition","display_name":"Singular value decomposition","score":0.4474598169326782},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3648790121078491},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.2766833007335663},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.270749032497406},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.16546401381492615}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7572758793830872},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.7384740710258484},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.720963180065155},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.535027027130127},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5208666324615479},{"id":"https://openalex.org/C112933361","wikidata":"https://www.wikidata.org/wiki/Q2845258","display_name":"Probabilistic latent semantic analysis","level":2,"score":0.5111966729164124},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.48733219504356384},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.45979899168014526},{"id":"https://openalex.org/C22789450","wikidata":"https://www.wikidata.org/wiki/Q420904","display_name":"Singular value decomposition","level":2,"score":0.4474598169326782},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3648790121078491},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2766833007335663},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.270749032497406},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.16546401381492615},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1458082.1458105","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1458082.1458105","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th ACM conference on Information and knowledge management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":63,"referenced_works":["https://openalex.org/W41480884","https://openalex.org/W41690797","https://openalex.org/W81719197","https://openalex.org/W93781279","https://openalex.org/W101693742","https://openalex.org/W115700959","https://openalex.org/W121163546","https://openalex.org/W156841640","https://openalex.org/W156967137","https://openalex.org/W159518475","https://openalex.org/W204086241","https://openalex.org/W849495462","https://openalex.org/W1484719069","https://openalex.org/W1491334865","https://openalex.org/W1520286206","https://openalex.org/W1529131185","https://openalex.org/W1534523911","https://openalex.org/W1553600843","https://openalex.org/W1582918847","https://openalex.org/W1584739173","https://openalex.org/W1602633340","https://openalex.org/W1732828232","https://openalex.org/W1878377492","https://openalex.org/W1982628673","https://openalex.org/W1983578042","https://openalex.org/W1991713115","https://openalex.org/W2049384587","https://openalex.org/W2058616517","https://openalex.org/W2062630764","https://openalex.org/W2066532839","https://openalex.org/W2109749916","https://openalex.org/W2110480283","https://openalex.org/W2126416132","https://openalex.org/W2126915677","https://openalex.org/W2131904442","https://openalex.org/W2142189579","https://openalex.org/W2145631291","https://openalex.org/W2145819623","https://openalex.org/W2146012283","https://openalex.org/W2147152072","https://openalex.org/W2149285182","https://openalex.org/W2149684740","https://openalex.org/W2152311353","https://openalex.org/W2153508286","https://openalex.org/W2156553253","https://openalex.org/W2161308148","https://openalex.org/W2168625136","https://openalex.org/W2397021650","https://openalex.org/W2599276130","https://openalex.org/W2608500270","https://openalex.org/W2622806907","https://openalex.org/W2749873526","https://openalex.org/W2760669695","https://openalex.org/W2954620812","https://openalex.org/W2979473749","https://openalex.org/W3009569740","https://openalex.org/W3099898773","https://openalex.org/W4229898513","https://openalex.org/W4285719527","https://openalex.org/W4403333810","https://openalex.org/W6603779292","https://openalex.org/W6681698864","https://openalex.org/W6682410943"],"related_works":["https://openalex.org/W4389358162","https://openalex.org/W2033524022","https://openalex.org/W2111020819","https://openalex.org/W2377594161","https://openalex.org/W2296297476","https://openalex.org/W2329943782","https://openalex.org/W1578340400","https://openalex.org/W2365514879","https://openalex.org/W15987807","https://openalex.org/W2420905679"],"abstract_inverted_index":{"The":[0],"technique":[1],"of":[2,12,45,64,76],"latent":[3],"semantic":[4],"indexing":[5],"is":[6],"used":[7],"in":[8,42,67],"a":[9],"wide":[10],"variety":[11],"commercial":[13,56],"applications.":[14],"In":[15,54],"these":[16],"applications,":[17,58],"the":[18,28,43,50,74],"processing":[19,29],"time":[20,30],"and":[21,27,31],"RAM":[22,32],"required":[23,33],"for":[24,49],"SVD":[25],"computation,":[26],"during":[34],"LSI":[35,51,57],"retrieval":[36],"operations":[37],"are":[38],"all":[39],"roughly":[40],"linear":[41],"number":[44],"dimensions,":[46],"k,":[47],"chosen":[48],"representation":[52],"space.":[53],"large-scale":[55],"reducing":[59,68],"k":[60],"values":[61],"could":[62],"be":[63],"significant":[65],"value":[66],"server":[69],"costs.":[70],"This":[71],"paper":[72],"explores":[73],"effects":[75],"varying":[77],"dimensionality.":[78]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":12},{"year":2017,"cited_by_count":11},{"year":2016,"cited_by_count":10},{"year":2015,"cited_by_count":13},{"year":2014,"cited_by_count":14},{"year":2013,"cited_by_count":15},{"year":2012,"cited_by_count":9}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
