{"id":"https://openalex.org/W3175378934","doi":"https://doi.org/10.1145/3448016.3457319","title":"Efficient String Sort with Multi-Character Encoding and Adaptive Sampling","display_name":"Efficient String Sort with Multi-Character Encoding and Adaptive Sampling","publication_year":2021,"publication_date":"2021-06-09","ids":{"openalex":"https://openalex.org/W3175378934","doi":"https://doi.org/10.1145/3448016.3457319","mag":"3175378934"},"language":"en","primary_location":{"id":"doi:10.1145/3448016.3457319","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3448016.3457319","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 International Conference on Management of Data","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102943951","display_name":"Wen Jin","orcid":"https://orcid.org/0000-0002-5992-2531"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wen Jin","raw_affiliation_strings":["Independent Researcher, Vancouver, BC, Canada"],"affiliations":[{"raw_affiliation_string":"Independent Researcher, Vancouver, BC, Canada","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089931216","display_name":"Weining Qian","orcid":"https://orcid.org/0000-0002-4132-8630"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weining Qian","raw_affiliation_strings":["East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101511862","display_name":"Aoying Zhou","orcid":"https://orcid.org/0000-0002-4665-7302"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Aoying Zhou","raw_affiliation_strings":["East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102943951"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.136,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.53149618,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"872","last_page":"884"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12326","display_name":"Network Packet Processing and Optimization","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sort","display_name":"sort","score":0.7340303659439087},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7092748284339905},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.6810091137886047},{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.6755018830299377},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.576054573059082},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.4572775363922119},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.4370790719985962},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3785797953605652},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.3493499755859375},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.25900062918663025},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2273084819316864},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.09293988347053528},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.0858469009399414}],"concepts":[{"id":"https://openalex.org/C88548561","wikidata":"https://www.wikidata.org/wiki/Q347599","display_name":"sort","level":2,"score":0.7340303659439087},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7092748284339905},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.6810091137886047},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.6755018830299377},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.576054573059082},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4572775363922119},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.4370790719985962},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3785797953605652},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.3493499755859375},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25900062918663025},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2273084819316864},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.09293988347053528},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0858469009399414},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3448016.3457319","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3448016.3457319","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 International Conference on Management of Data","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5699999928474426,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1490429615","https://openalex.org/W1539580421","https://openalex.org/W1574212840","https://openalex.org/W1852127287","https://openalex.org/W1864523757","https://openalex.org/W1902965424","https://openalex.org/W2031833362","https://openalex.org/W2055768308","https://openalex.org/W2065457989","https://openalex.org/W2068361557","https://openalex.org/W2080092059","https://openalex.org/W2125027776","https://openalex.org/W2125449202","https://openalex.org/W2130664790","https://openalex.org/W2157718155","https://openalex.org/W2293095839","https://openalex.org/W2962856362","https://openalex.org/W3029541804","https://openalex.org/W3139694570","https://openalex.org/W4245107430","https://openalex.org/W6602011139"],"related_works":["https://openalex.org/W2389073067","https://openalex.org/W3110976612","https://openalex.org/W2359478580","https://openalex.org/W2394184555","https://openalex.org/W2367039694","https://openalex.org/W2355476020","https://openalex.org/W1573092629","https://openalex.org/W2949751574","https://openalex.org/W2133764934","https://openalex.org/W1509806135"],"abstract_inverted_index":{"Sorting":[0],"plays":[1],"a":[2,37,83,201],"fundamental":[3],"role":[4],"in":[5,13,60,122,200],"computer":[6],"science.":[7],"It":[8],"has":[9],"far":[10],"reaching":[11],"applications":[12],"database":[14],"operations":[15],"and":[16,28,151,165,192],"data":[17],"science":[18],"tasks.":[19],"An":[20],"important":[21],"class":[22],"of":[23,71,101,112,115,224],"sorting":[24,32,62,142,157,217],"keys":[25],"are":[26,119],"strings":[27,190],"among":[29],"all":[30],"string":[31,50,216],"methods,":[33],"radix":[34,49,73,146],"sort":[35,147,150],"is":[36,55,207],"simple":[38],"but":[39],"effective":[40,127],"algorithm.":[41],"Many":[42],"works":[43],"have":[44],"been":[45],"studied":[46],"to":[47,56,135],"accelerate":[48],"sort.":[51],"One":[52],"typical":[53],"approach":[54,66],"process":[57,134],"multiple":[58],"characters":[59],"each":[61],"pass.":[63],"However,":[64],"this":[65],"incurs":[67],"the":[68,72,79,93,102,110,116,126,137,185,195,212,222],"crucial":[69],"issue":[70],"being":[74],"too":[75],"large.":[76],"To":[77],"address":[78],"problem,":[80],"we":[81],"introduce":[82],"novel":[84],"multi-character":[85],"encoding":[86,97,128,138],"based":[87],"method":[88,171],"that":[89,169],"can":[90],"significantly":[91],"reduce":[92],"radix.":[94],"This":[95],"new":[96],"scheme":[98,129],"takes":[99],"advantage":[100],"sparse":[103],"alphabet":[104],"space":[105],"usage":[106],"as":[107,109],"well":[108],"sparsity":[111],"distinguishing":[113],"prefixes":[114],"inputs":[117],"which":[118,220],"commonly":[120],"seen":[121],"real-world":[123],"datasets.":[124],"Combining":[125],"with":[130,148],"an":[131,173],"adaptive":[132],"sampling":[133],"generate":[136],"efficiently,":[139],"our":[140,170,225],"proposed":[141],"algorithm":[143,218],"essentially":[144],"blends":[145],"sample":[149],"achieves":[152],"substantial":[153],"improvement":[154,177,183],"over":[155,178,184,194],"other":[156],"approaches.":[158],"The":[159],"results":[160],"on":[161,189],"both":[162],"real":[163],"datasets":[164,167],"synthetic":[166],"show":[168,205],"yields":[172],"average":[174],"4.85\u00d7":[175],"performance":[176],"C++":[179],"STL":[180],"sort[21],":[181],"1.47\u00d7":[182],"state-of-the-art":[186],"Radix":[187],"Sort":[188],"implementation[19]":[191],"2.55\u00d7":[193],"multikey":[196],"quicksort[6].":[197],"Preliminary":[198],"tests":[199],"multi-core":[202],"environment":[203],"also":[204],"it":[206],"competitive":[208],"or":[209],"better":[210],"than":[211],"most":[213],"recent":[214],"parallel":[215],"pS5[8]":[219],"demonstrates":[221],"scalability":[223],"method.":[226]},"counts_by_year":[{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
