{"id":"https://openalex.org/W1971155008","doi":"https://doi.org/10.1109/bigdata.2013.6691602","title":"Fast scalable selection algorithms for large scale data","display_name":"Fast scalable selection algorithms for large scale data","publication_year":2013,"publication_date":"2013-10-01","ids":{"openalex":"https://openalex.org/W1971155008","doi":"https://doi.org/10.1109/bigdata.2013.6691602","mag":"1971155008"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2013.6691602","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2013.6691602","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Conference on Big Data","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037515970","display_name":"Lee Parnell Thompson","orcid":null},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Lee Parnell Thompson","raw_affiliation_strings":["Department of Computer Science, University of Texas at Austin, Austin, TX","Department of Computer Science, University of Texas at Austin, Austin, TX, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Texas at Austin, Austin, TX","institution_ids":["https://openalex.org/I86519309"]},{"raw_affiliation_string":"Department of Computer Science, University of Texas at Austin, Austin, TX, USA#TAB#","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101883722","display_name":"Weijia Xu","orcid":"https://orcid.org/0000-0002-5134-6381"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Weijia Xu","raw_affiliation_strings":["Texas Advanced Computing Center, University of Texas at Austin, Austin, TX","Texas Adv. Comput. Center, Univ. of Texas at Austin, Austin, TX, USA"],"affiliations":[{"raw_affiliation_string":"Texas Advanced Computing Center, University of Texas at Austin, Austin, TX","institution_ids":[]},{"raw_affiliation_string":"Texas Adv. Comput. Center, Univ. of Texas at Austin, Austin, TX, USA","institution_ids":["https://openalex.org/I86519309"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083499808","display_name":"Daniel P. Miranker","orcid":"https://orcid.org/0009-0003-8838-2890"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Daniel P. Miranker","raw_affiliation_strings":["Department of Computer Science, University of Texas at Austin, Austin, TX","Department of Computer Science, University of Texas at Austin, Austin, TX, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Texas at Austin, Austin, TX","institution_ids":["https://openalex.org/I86519309"]},{"raw_affiliation_string":"Department of Computer Science, University of Texas at Austin, Austin, TX, USA#TAB#","institution_ids":["https://openalex.org/I86519309"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5037515970"],"corresponding_institution_ids":["https://openalex.org/I86519309"],"apc_list":null,"apc_paid":null,"fwci":0.809,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.81158399,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"412","last_page":"420"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.8289902210235596},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8037735819816589},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.6886485815048218},{"id":"https://openalex.org/keywords/sorting","display_name":"Sorting","score":0.6476743817329407},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.6245556473731995},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.5815474987030029},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5554987788200378},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4786566495895386},{"id":"https://openalex.org/keywords/selection-algorithm","display_name":"Selection algorithm","score":0.4611499607563019},{"id":"https://openalex.org/keywords/map-reduce","display_name":"Map reduce","score":0.4554831385612488},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.44397449493408203},{"id":"https://openalex.org/keywords/volume","display_name":"Volume (thermodynamics)","score":0.43713492155075073},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.38893961906433105},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.3130861818790436},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.22682848572731018},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.20552515983581543}],"concepts":[{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.8289902210235596},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8037735819816589},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.6886485815048218},{"id":"https://openalex.org/C111696304","wikidata":"https://www.wikidata.org/wiki/Q2303697","display_name":"Sorting","level":2,"score":0.6476743817329407},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.6245556473731995},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.5815474987030029},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5554987788200378},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4786566495895386},{"id":"https://openalex.org/C2775973920","wikidata":"https://www.wikidata.org/wiki/Q3252726","display_name":"Selection algorithm","level":3,"score":0.4611499607563019},{"id":"https://openalex.org/C3019257732","wikidata":"https://www.wikidata.org/wiki/Q567759","display_name":"Map reduce","level":3,"score":0.4554831385612488},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.44397449493408203},{"id":"https://openalex.org/C20556612","wikidata":"https://www.wikidata.org/wiki/Q4469374","display_name":"Volume (thermodynamics)","level":2,"score":0.43713492155075073},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.38893961906433105},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.3130861818790436},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.22682848572731018},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.20552515983581543},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata.2013.6691602","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2013.6691602","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Conference on Big Data","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.4099999964237213,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320310620","display_name":"University of Texas at Austin","ror":"https://ror.org/00hj54h04"},{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W202290546","https://openalex.org/W1525159070","https://openalex.org/W1556524945","https://openalex.org/W1792966054","https://openalex.org/W1996641400","https://openalex.org/W2000337320","https://openalex.org/W2060556416","https://openalex.org/W2074499935","https://openalex.org/W2074982700","https://openalex.org/W2082357899","https://openalex.org/W2092446961","https://openalex.org/W2098935637","https://openalex.org/W2169178492","https://openalex.org/W2173213060","https://openalex.org/W4231266747","https://openalex.org/W4235295823","https://openalex.org/W6631656446"],"related_works":["https://openalex.org/W2000785801","https://openalex.org/W986318368","https://openalex.org/W2384410913","https://openalex.org/W2352878646","https://openalex.org/W2004734601","https://openalex.org/W2130149817","https://openalex.org/W2990194547","https://openalex.org/W1480123525","https://openalex.org/W2620865396","https://openalex.org/W2115605707"],"abstract_inverted_index":{"Selection":[0],"finding,":[1,8,144],"and":[2,22,40,108,166,205,241],"its":[3],"most":[4],"common":[5,230],"form":[6],"median":[7],"are":[9,62,80,200,246],"used":[10,160],"as":[11,30,41,86],"a":[12,31,63,74,121,170,183,195,208],"measure":[13],"of":[14,65,68,73,78,89,123,142,191],"central":[15],"tendency":[16],"for":[17,57,135,139,194,203],"problems":[18,25],"in":[19,82,102,151,207,225,232],"biology,":[20],"databases,":[21],"graphics.":[23],"These":[24],"often":[26],"require":[27],"selection":[28,70,110,143,164],"finding":[29,111,146],"subcomponent":[32],"where":[33],"it":[34],"can":[35,97],"be":[36,53],"called":[37],"many":[38],"times,":[39],"such":[42],"speed":[43],"is":[44],"important.":[45],"The":[46,218],"Map/Reduce":[47,75,137,175],"framework":[48,138,176],"has":[49,113],"been":[50,131],"shown":[51],"to":[52,99,116,120,186,214],"an":[54,106,152],"important":[55],"tool":[56],"creating":[58],"scalable":[59,109],"applications.":[60,124],"There":[61],"number":[64,122],"valid":[66],"implementations":[67,245],"the":[69,87,114,136,140,147,158,174,188,198,222],"algorithms":[71,128,165,199],"inside":[72],"framework,":[76],"certain":[77],"which":[79],"compared":[81,201],"this":[83,226],"paper.":[84],"However,":[85],"volume":[88],"data":[90],"increases,":[91],"subtle":[92],"theoretical":[93],"algorithmic":[94],"implementation":[95],"differences":[96,101],"lead":[98],"significant":[100],"practical":[103],"application.":[104],"Therefore,":[105],"efficient":[107],"method":[112,172],"potential":[115],"provide":[117],"general":[118],"benefit":[119],"This":[125,155],"paper":[126,156,227],"compares":[127],"that":[129,221],"have":[130],"redesigned":[132],"or":[133],"created":[134],"purpose":[141],"or,":[145],"k-th":[148],"ranked":[149],"element":[150],"unordered":[153],"set.":[154],"takes":[157],"concepts":[159],"from":[161],"two":[162,178],"existing":[163],"translates":[167],"them":[168],"into":[169],"novel":[171],"using":[173,238],"with":[177,212,235],"variations.":[179],"Each":[180],"approach":[181],"uses":[182],"different":[184],"methodology":[185],"reduce":[187],"total":[189],"amount":[190],"workload":[192],"needed":[193],"selection.":[196],"All":[197],"together":[202],"scalability":[204],"efficiency":[206],"computing":[209],"cluster":[210],"environment":[211],"up":[213],"256":[215],"processing":[216],"cores.":[217],"results":[219],"show":[220],"methods":[223],"proposed":[224],"outperform":[228],"several":[229],"alternatives":[231],"identifying":[233],"medians":[234],"Hadoop,":[236],"including":[237],"sorting,":[239],"Pig,":[240],"BinMedian":[242],"methods.":[243],"Our":[244],"also":[247],"available":[248],"upon":[249],"request.":[250]},"counts_by_year":[{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
