{"id":"https://openalex.org/W2133601909","doi":"https://doi.org/10.1109/hipc.2009.5433188","title":"Performance optimizations for distributed real-time text indexing","display_name":"Performance optimizations for distributed real-time text indexing","publication_year":2009,"publication_date":"2009-12-01","ids":{"openalex":"https://openalex.org/W2133601909","doi":"https://doi.org/10.1109/hipc.2009.5433188","mag":"2133601909"},"language":"en","primary_location":{"id":"doi:10.1109/hipc.2009.5433188","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hipc.2009.5433188","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 International Conference on High Performance Computing (HiPC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109064591","display_name":"Ankur Narang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210103279","display_name":"IBM Research - India","ror":"https://ror.org/014wt7r80","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210103279","https://openalex.org/I4210114115"]},{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["IN","US"],"is_corresponding":true,"raw_author_name":"Ankur Narang","raw_affiliation_strings":["IBM India Research Laboratory, New Delhi, India","IBM India Research Laboratory, New Delhi, India#TAB#"],"affiliations":[{"raw_affiliation_string":"IBM India Research Laboratory, New Delhi, India","institution_ids":["https://openalex.org/I4210103279"]},{"raw_affiliation_string":"IBM India Research Laboratory, New Delhi, India#TAB#","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102006304","display_name":"Karthik Swaminathan","orcid":"https://orcid.org/0000-0002-4799-7587"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]},{"id":"https://openalex.org/I4210103279","display_name":"IBM Research - India","ror":"https://ror.org/014wt7r80","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210103279","https://openalex.org/I4210114115"]}],"countries":["IN","US"],"is_corresponding":false,"raw_author_name":"Karthik Swaminathan","raw_affiliation_strings":["IBM India Research Laboratory, New Delhi, India","IBM India Research Laboratory, New Delhi, India#TAB#"],"affiliations":[{"raw_affiliation_string":"IBM India Research Laboratory, New Delhi, India","institution_ids":["https://openalex.org/I4210103279"]},{"raw_affiliation_string":"IBM India Research Laboratory, New Delhi, India#TAB#","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028084401","display_name":"Prashant Agrawal","orcid":"https://orcid.org/0000-0002-7890-024X"},"institutions":[{"id":"https://openalex.org/I4210103279","display_name":"IBM Research - India","ror":"https://ror.org/014wt7r80","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210103279","https://openalex.org/I4210114115"]},{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["IN","US"],"is_corresponding":false,"raw_author_name":"Prashant Agrawal","raw_affiliation_strings":["IBM India Research Laboratory, New Delhi, India","IBM India Research Laboratory, New Delhi, India#TAB#"],"affiliations":[{"raw_affiliation_string":"IBM India Research Laboratory, New Delhi, India","institution_ids":["https://openalex.org/I4210103279"]},{"raw_affiliation_string":"IBM India Research Laboratory, New Delhi, India#TAB#","institution_ids":["https://openalex.org/I1341412227"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5109064591"],"corresponding_institution_ids":["https://openalex.org/I1341412227","https://openalex.org/I4210103279"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.1300359,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":"52","issue":null,"first_page":"398","last_page":"407"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10742","display_name":"Peer-to-Peer Network Technologies","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.8157094717025757},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7961245775222778},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7621269822120667},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5471484065055847},{"id":"https://openalex.org/keywords/massively-parallel","display_name":"Massively parallel","score":0.5125236511230469},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.49804210662841797},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.4916239380836487},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3355664312839508},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.1980333924293518},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.17055749893188477},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.11561018228530884}],"concepts":[{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.8157094717025757},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7961245775222778},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7621269822120667},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5471484065055847},{"id":"https://openalex.org/C190475519","wikidata":"https://www.wikidata.org/wiki/Q544384","display_name":"Massively parallel","level":2,"score":0.5125236511230469},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.49804210662841797},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.4916239380836487},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3355664312839508},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.1980333924293518},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.17055749893188477},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.11561018228530884},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hipc.2009.5433188","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hipc.2009.5433188","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 International Conference on High Performance Computing (HiPC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1578100948","https://openalex.org/W1985102977","https://openalex.org/W2022578651","https://openalex.org/W2059387258","https://openalex.org/W2124306283","https://openalex.org/W2135552899","https://openalex.org/W2140795521","https://openalex.org/W2173213060","https://openalex.org/W3003506064","https://openalex.org/W6634462686","https://openalex.org/W6678405132"],"related_works":["https://openalex.org/W2023839151","https://openalex.org/W1774183074","https://openalex.org/W2057488824","https://openalex.org/W4401278057","https://openalex.org/W2334687145","https://openalex.org/W2178011914","https://openalex.org/W4235962491","https://openalex.org/W2061778832","https://openalex.org/W1513001507","https://openalex.org/W2257153718"],"abstract_inverted_index":{"DISC":[0,10],"(Data-Intensive":[1],"Super":[2],"Computing)":[3],"is":[4,213,286],"gaining":[5],"strong":[6,262],"research":[7],"momentum":[8],"[1].":[9],"systems":[11,99],"differ":[12],"from":[13],"conventional":[14],"supercomputers":[15],"in":[16,31,187,261],"their":[17],"focus":[18],"on":[19,97,198,235,249,276,293],"data,":[20,211],"as":[21,230],"they":[22],"acquire":[23],"and":[24,51,75,123,133,142,167,177,184,222,263],"maintain":[25],"continually":[26],"changing":[27],"massive":[28,93],"data":[29,56,95],"sets,":[30],"addition":[32],"to":[33],"performing":[34],"large-scale":[35],"computations":[36],"over":[37,125,271],"the":[38,45,149,156,180,188,217,236,259,272,280,287],"data.":[39],"Towards":[40],"this":[41,79,285],"end,":[42],"we":[43,131,154],"consider":[44],"problem":[46,80],"of":[47,92,103,158,182,195,201,239,246,266,282],"real-time":[48],"text":[49,90],"indexing":[50,91,112,122,193,227,269,289],"search":[52,70,107,124,254,300],"with":[53,63,105,161,169,252,298],"high":[54],"input":[55,94],"rates":[57],"(10":[58],"GB/s":[59],"or":[60],"more)":[61],"along":[62],"small":[64,164],"index":[65],"age-off":[66],"time":[67,152],"while":[68],"sustaining":[69],"response":[71],"time.":[72],"Load":[73],"imbalance":[74],"communication":[76,135],"bottlenecks":[77],"make":[78],"particularly":[81],"challenging.":[82],"We":[83,190,256],"present":[84],"performance":[85,108],"optimizations":[86,136],"for":[87,148,163,171],"distributed":[88,111,268],"in-memory":[89],"sets":[96],"parallel":[98,127,151],"having":[100],"large":[101,295],"number":[102,181,238],"cores/processors,":[104],"sustained":[106,253,299],"[2].":[109],"Our":[110],"algorithm":[113,160,270],"uses":[114],"a":[115,294],"hybrid":[116],"group-based":[117],"approach":[118],"which":[119,212],"enables":[120],"scalable":[121],"massively":[126],"systems.":[128],"In":[129],"addition,":[130],"designed":[132],"analyzed":[134],"including":[137],"routing":[138],"using":[139,207],"Steiner":[140],"nodes":[141,200,251],"topology":[143],"mapping.":[144],"Using":[145],"theoretical":[146],"analysis":[147],"asymptotic":[150],"complexity":[153],"establish":[155],"scalability":[157,168,265],"our":[159,267,283],"|P|":[162,176],"index-group":[165,173],"size":[166],"|C|":[170,178],"larger":[172],"size;":[174],"where":[175],"are":[179],"Producers":[183],"Consumers":[185],"respectively,":[186],"index-group.":[189],"have":[191],"obtained":[192],"throughput":[194,220,245,290],"524":[196],"GB/min":[197],"4K":[199],"Blue":[202,277],"Gene/L":[203],"<sup":[204,232],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[205,233],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">1</sup>":[206],"actual":[208],"IBM":[209],"intranet":[210],"3.36x":[214],"better":[215,224],"than":[216,225],"previous":[218,273],"best":[219,274,281],"[3]":[221,275],"10.3x":[223],"typical":[226],"approaches":[228],"such":[229],"CLucene":[231],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">2</sup>":[234],"same":[237],"nodes.":[240],"This":[241],"gives":[242],"an":[243],"estimated":[244],"17":[247],"TB/min":[248],"128K":[250],"performance.":[255,301],"also":[257],"demonstrate":[258],"improvements":[260],"weak":[264],"Gene/L.":[278],"To":[279],"knowledge,":[284],"highest":[288],"ever":[291],"published":[292],"scale":[296],"system":[297]},"counts_by_year":[{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
