{"id":"https://openalex.org/W2585767516","doi":"https://doi.org/10.1109/bigdata.2016.7840607","title":"YinMem: A distributed parallel indexed in-memory computation system for large scale data analytics","display_name":"YinMem: A distributed parallel indexed in-memory computation system for large scale data analytics","publication_year":2016,"publication_date":"2016-12-01","ids":{"openalex":"https://openalex.org/W2585767516","doi":"https://doi.org/10.1109/bigdata.2016.7840607","mag":"2585767516"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2016.7840607","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2016.7840607","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109833458","display_name":"Yin Huang","orcid":"https://orcid.org/0000-0001-7370-7259"},"institutions":[{"id":"https://openalex.org/I79272384","display_name":"University of Maryland, Baltimore County","ror":"https://ror.org/02qskvh78","country_code":"US","type":"education","lineage":["https://openalex.org/I79272384"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yin Huang","raw_affiliation_strings":["Computer Science and Electrical Engineering, University of Maryland, Baltimore County, Baltimore, MD, 21220","Computer Science and Electrical Engineering, University of Maryland, Baltimore, MD, Baltimore County"],"affiliations":[{"raw_affiliation_string":"Computer Science and Electrical Engineering, University of Maryland, Baltimore County, Baltimore, MD, 21220","institution_ids":["https://openalex.org/I79272384"]},{"raw_affiliation_string":"Computer Science and Electrical Engineering, University of Maryland, Baltimore, MD, Baltimore County","institution_ids":["https://openalex.org/I79272384"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072869372","display_name":"Yelena Yesha","orcid":null},"institutions":[{"id":"https://openalex.org/I79272384","display_name":"University of Maryland, Baltimore County","ror":"https://ror.org/02qskvh78","country_code":"US","type":"education","lineage":["https://openalex.org/I79272384"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yelena Yesha","raw_affiliation_strings":["Computer Science and Electrical Engineering, University of Maryland, Baltimore County, Baltimore, MD, 21220","Computer Science and Electrical Engineering, University of Maryland, Baltimore, MD, Baltimore County"],"affiliations":[{"raw_affiliation_string":"Computer Science and Electrical Engineering, University of Maryland, Baltimore County, Baltimore, MD, 21220","institution_ids":["https://openalex.org/I79272384"]},{"raw_affiliation_string":"Computer Science and Electrical Engineering, University of Maryland, Baltimore, MD, Baltimore County","institution_ids":["https://openalex.org/I79272384"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004628313","display_name":"Milton Halem","orcid":"https://orcid.org/0000-0002-5614-3612"},"institutions":[{"id":"https://openalex.org/I79272384","display_name":"University of Maryland, Baltimore County","ror":"https://ror.org/02qskvh78","country_code":"US","type":"education","lineage":["https://openalex.org/I79272384"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Milton Halem","raw_affiliation_strings":["Computer Science and Electrical Engineering, University of Maryland, Baltimore County, Baltimore, MD, 21220","Computer Science and Electrical Engineering, University of Maryland, Baltimore, MD, Baltimore County"],"affiliations":[{"raw_affiliation_string":"Computer Science and Electrical Engineering, University of Maryland, Baltimore County, Baltimore, MD, 21220","institution_ids":["https://openalex.org/I79272384"]},{"raw_affiliation_string":"Computer Science and Electrical Engineering, University of Maryland, Baltimore, MD, Baltimore County","institution_ids":["https://openalex.org/I79272384"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111941996","display_name":"Yaacov Yesha","orcid":null},"institutions":[{"id":"https://openalex.org/I79272384","display_name":"University of Maryland, Baltimore County","ror":"https://ror.org/02qskvh78","country_code":"US","type":"education","lineage":["https://openalex.org/I79272384"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yaacov Yesha","raw_affiliation_strings":["Computer Science and Electrical Engineering, University of Maryland, Baltimore County, Baltimore, MD, 21220","Computer Science and Electrical Engineering, University of Maryland, Baltimore, MD, Baltimore County"],"affiliations":[{"raw_affiliation_string":"Computer Science and Electrical Engineering, University of Maryland, Baltimore County, Baltimore, MD, 21220","institution_ids":["https://openalex.org/I79272384"]},{"raw_affiliation_string":"Computer Science and Electrical Engineering, University of Maryland, Baltimore, MD, Baltimore County","institution_ids":["https://openalex.org/I79272384"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103531132","display_name":"Shujia Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I79272384","display_name":"University of Maryland, Baltimore County","ror":"https://ror.org/02qskvh78","country_code":"US","type":"education","lineage":["https://openalex.org/I79272384"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shujia Zhou","raw_affiliation_strings":["Computer Science and Electrical Engineering, University of Maryland, Baltimore County, Baltimore, MD, 21220","Computer Science and Electrical Engineering, University of Maryland, Baltimore, MD, Baltimore County"],"affiliations":[{"raw_affiliation_string":"Computer Science and Electrical Engineering, University of Maryland, Baltimore County, Baltimore, MD, 21220","institution_ids":["https://openalex.org/I79272384"]},{"raw_affiliation_string":"Computer Science and Electrical Engineering, University of Maryland, Baltimore, MD, Baltimore County","institution_ids":["https://openalex.org/I79272384"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5109833458"],"corresponding_institution_ids":["https://openalex.org/I79272384"],"apc_list":null,"apc_paid":null,"fwci":1.002,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.84068673,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"214","last_page":"222"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8461209535598755},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.7169731855392456},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6370940804481506},{"id":"https://openalex.org/keywords/nosql","display_name":"NoSQL","score":0.6284056305885315},{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.527593195438385},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.49115726351737976},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.47337645292282104},{"id":"https://openalex.org/keywords/sparse-matrix","display_name":"Sparse matrix","score":0.4716217815876007},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.4664824306964874},{"id":"https://openalex.org/keywords/distributed-memory","display_name":"Distributed memory","score":0.458992063999176},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.45121246576309204},{"id":"https://openalex.org/keywords/computer-cluster","display_name":"Computer cluster","score":0.41799402236938477},{"id":"https://openalex.org/keywords/distributed-file-system","display_name":"Distributed File System","score":0.41603395342826843},{"id":"https://openalex.org/keywords/distributed-database","display_name":"Distributed database","score":0.41580504179000854},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.35650596022605896},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.2809904217720032},{"id":"https://openalex.org/keywords/shared-memory","display_name":"Shared memory","score":0.2583826184272766},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.19117090106010437},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.18514275550842285},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.17149803042411804}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8461209535598755},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.7169731855392456},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6370940804481506},{"id":"https://openalex.org/C2779599972","wikidata":"https://www.wikidata.org/wiki/Q82231","display_name":"NoSQL","level":3,"score":0.6284056305885315},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.527593195438385},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.49115726351737976},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.47337645292282104},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.4716217815876007},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.4664824306964874},{"id":"https://openalex.org/C91481028","wikidata":"https://www.wikidata.org/wiki/Q1054686","display_name":"Distributed memory","level":3,"score":0.458992063999176},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.45121246576309204},{"id":"https://openalex.org/C29140674","wikidata":"https://www.wikidata.org/wiki/Q206637","display_name":"Computer cluster","level":2,"score":0.41799402236938477},{"id":"https://openalex.org/C152043487","wikidata":"https://www.wikidata.org/wiki/Q1229600","display_name":"Distributed File System","level":2,"score":0.41603395342826843},{"id":"https://openalex.org/C70061542","wikidata":"https://www.wikidata.org/wiki/Q989016","display_name":"Distributed database","level":2,"score":0.41580504179000854},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.35650596022605896},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.2809904217720032},{"id":"https://openalex.org/C133875982","wikidata":"https://www.wikidata.org/wiki/Q764810","display_name":"Shared memory","level":2,"score":0.2583826184272766},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.19117090106010437},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.18514275550842285},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.17149803042411804},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata.2016.7840607","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2016.7840607","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W200298483","https://openalex.org/W1123101191","https://openalex.org/W1973262089","https://openalex.org/W1982767656","https://openalex.org/W2013344760","https://openalex.org/W2013373704","https://openalex.org/W2014168697","https://openalex.org/W2030165200","https://openalex.org/W2038157364","https://openalex.org/W2096544401","https://openalex.org/W2103460560","https://openalex.org/W2112651225","https://openalex.org/W2120458882","https://openalex.org/W2129898896","https://openalex.org/W2131323843","https://openalex.org/W2131975293","https://openalex.org/W2138474206","https://openalex.org/W2153820245","https://openalex.org/W2165874743","https://openalex.org/W2170616854","https://openalex.org/W2190012392","https://openalex.org/W2220625384","https://openalex.org/W4239429564","https://openalex.org/W6607964021","https://openalex.org/W6679524442","https://openalex.org/W6684578312"],"related_works":["https://openalex.org/W2799973158","https://openalex.org/W2419153746","https://openalex.org/W3089119258","https://openalex.org/W2923327995","https://openalex.org/W2518340158","https://openalex.org/W3147331693","https://openalex.org/W349054995","https://openalex.org/W2086537700","https://openalex.org/W2354643924","https://openalex.org/W3152235737"],"abstract_inverted_index":{"Machine":[0],"learning":[1,91],"and":[2,18,30,76,147,177,198,220],"graph":[3],"analytics":[4],"typically":[5],"process":[6],"data":[7,15,43,58,74,97,102,121,161,180,201],"in":[8,26,62,70,112,115],"an":[9],"iterative":[10,89],"way,":[11],"reading":[12,128],"the":[13,23,49,71,95,142,156,159,185,194],"same":[14,96],"multiple":[16,98],"times":[17],"sharing":[19,202],"intermediate":[20,204],"results":[21,207],"across":[22],"worker":[24,108,117],"nodes":[25],"cluster.":[27],"Hadoop":[28,145],"MapReduce":[29,55,151],"Spark":[31,46],"are":[32],"two":[33],"popular":[34],"open":[35],"source":[36],"cluster":[37],"compute":[38],"frameworks":[39],"for":[40,88,104,171,217],"large":[41,172],"scale":[42,225],"analytics.":[44],"Apache":[45],"is":[47,78,85],"currently":[48],"state-of-the-art":[50],"in-memory":[51,138,195],"computation":[52,139,170],"model":[53],"extending":[54],"by":[56,81,149,175],"transforming":[57],"into":[59],"RDDs":[60,113],"stored":[61,114],"memory.":[63],"One":[64],"limitation":[65],"of":[66,158,187,203,222],"Spark,":[67,216],"however,":[68],"lies":[69],"fact":[72],"that":[73,209],"transformation":[75],"distribution":[77],"implicitly":[79],"managed":[80],"HDFS.":[82],"Data":[83],"locality":[84],"not":[86],"guaranteed":[87],"machine":[90],"algorithms":[92],"which":[93],"read":[94],"times.":[99],"For":[100],"example,":[101],"needed":[103],"operations":[105],"to":[106,169,184,215],"one":[107],"node":[109],"might":[110],"reside":[111],"other":[116],"nodes.":[118,189],"The":[119],"resulting":[120],"shuffling":[122],"becomes":[123],"a":[124,134,223],"bottleneck":[125],"when":[126],"iteratively":[127],"such":[129],"RDDs.":[130],"We":[131],"propose":[132],"YinMem,":[133],"parallel":[135],"distributed":[136,160],"indexed":[137,179],"system,":[140],"bridging":[141],"gap":[143],"between":[144],"ecosystem":[146],"HPC":[148],"replacing":[150],"with":[152],"MPI":[153],"while":[154],"obtaining":[155],"advantage":[157],"storage.":[162],"YinMem":[163,190,210],"achieves":[164],"fair":[165],"load":[166],"balancing":[167],"prior":[168],"sparse":[173,226],"matrix":[174],"scheduling":[176],"distributing":[178],"from":[181],"NoSQL":[182],"database":[183],"RAM":[186],"working":[188],"explores":[191],"Alluxio":[192],"as":[193],"storage":[196],"system":[197],"enables":[199],"efficient":[200],"results.":[205],"Preliminary":[206],"show":[208],"has":[211],"achieved":[212],"3\u00d7":[213],"speedup":[214],"computing":[218],"eigenvalue":[219],"eigenvectors":[221],"16-million":[224],"matrix.":[227]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
