{"id":"https://openalex.org/W2177237686","doi":"https://doi.org/10.1186/s13029-015-0045-3","title":"FlexDM: Simple, parallel and fault-tolerant data mining using WEKA","display_name":"FlexDM: Simple, parallel and fault-tolerant data mining using WEKA","publication_year":2015,"publication_date":"2015-11-17","ids":{"openalex":"https://openalex.org/W2177237686","doi":"https://doi.org/10.1186/s13029-015-0045-3","mag":"2177237686","pmid":"https://pubmed.ncbi.nlm.nih.gov/26579209"},"language":"en","primary_location":{"id":"doi:10.1186/s13029-015-0045-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13029-015-0045-3","pdf_url":"https://scfbm.biomedcentral.com/track/pdf/10.1186/s13029-015-0045-3","source":{"id":"https://openalex.org/S45786803","display_name":"Source Code for Biology and Medicine","issn_l":"1751-0473","issn":["1751-0473"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Source Code for Biology and Medicine","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://scfbm.biomedcentral.com/track/pdf/10.1186/s13029-015-0045-3","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017912813","display_name":"Madison Flannery","orcid":null},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Madison Flannery","raw_affiliation_strings":["Systems Biology Laboratory, University of Melbourne, Parkville, 3010 VIC Australia","Systems Biology Laboratory, University of Melbourne, Parkville, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Systems Biology Laboratory, University of Melbourne, Parkville, 3010 VIC Australia","institution_ids":[]},{"raw_affiliation_string":"Systems Biology Laboratory, University of Melbourne, Parkville, Australia","institution_ids":["https://openalex.org/I165779595"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003238807","display_name":"David Budden","orcid":"https://orcid.org/0000-0003-4372-8985"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"David M. Budden","raw_affiliation_strings":["Systems Biology Laboratory, University of Melbourne, Parkville, 3010 VIC Australia","Systems Biology Laboratory, University of Melbourne, Parkville, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Systems Biology Laboratory, University of Melbourne, Parkville, 3010 VIC Australia","institution_ids":[]},{"raw_affiliation_string":"Systems Biology Laboratory, University of Melbourne, Parkville, Australia","institution_ids":["https://openalex.org/I165779595"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011447378","display_name":"Alexandre Mendes","orcid":"https://orcid.org/0000-0003-1759-3765"},"institutions":[{"id":"https://openalex.org/I78757542","display_name":"University of Newcastle Australia","ror":"https://ror.org/00eae9z71","country_code":"AU","type":"education","lineage":["https://openalex.org/I78757542"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Alexandre Mendes","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, The University of Newcastle, Callaghan, 2308 NSW Australia","School of Electrical Engineering and Computer Science, The University of Newcastle, Callaghan, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, The University of Newcastle, Callaghan, 2308 NSW Australia","institution_ids":[]},{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, The University of Newcastle, Callaghan, Australia","institution_ids":["https://openalex.org/I78757542"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5011447378"],"corresponding_institution_ids":["https://openalex.org/I78757542"],"apc_list":null,"apc_paid":null,"fwci":0.8177,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.84427038,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"10","issue":"1","first_page":"13","last_page":"13"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.21809999644756317,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.21809999644756317,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.18019999563694,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10885","display_name":"Gene expression and cancer classification","score":0.13269999623298645,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8577017784118652},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.5698708891868591},{"id":"https://openalex.org/keywords/extensibility","display_name":"Extensibility","score":0.5179187655448914},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5039681792259216},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4967206120491028},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.4930371940135956},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35329681634902954},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.21862995624542236},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1928173303604126}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8577017784118652},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.5698708891868591},{"id":"https://openalex.org/C32833848","wikidata":"https://www.wikidata.org/wiki/Q4115054","display_name":"Extensibility","level":2,"score":0.5179187655448914},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5039681792259216},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4967206120491028},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.4930371940135956},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35329681634902954},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.21862995624542236},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1928173303604126}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.1186/s13029-015-0045-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13029-015-0045-3","pdf_url":"https://scfbm.biomedcentral.com/track/pdf/10.1186/s13029-015-0045-3","source":{"id":"https://openalex.org/S45786803","display_name":"Source Code for Biology and Medicine","issn_l":"1751-0473","issn":["1751-0473"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Source Code for Biology and Medicine","raw_type":"journal-article"},{"id":"pmid:26579209","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/26579209","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Source code for biology and medicine","raw_type":null},{"id":"pmh:oai:jupiter.its.unimelb.edu.au:11343/59494","is_oa":true,"landing_page_url":"http://hdl.handle.net/11343/59494","pdf_url":"http://hdl.handle.net/11343/59494","source":{"id":"https://openalex.org/S4377196259","display_name":"Minerva Access (University of Melbourne)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I165779595","host_organization_name":"The University of Melbourne","host_organization_lineage":["https://openalex.org/I165779595"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Journal Article"},{"id":"pmh:oai:europepmc.org:3619184","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/4647584","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Text"},{"id":"pmh:oai:figshare.com:article/28963862","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal contribution"},{"id":"pmh:uon:22675","is_oa":false,"landing_page_url":"http://hdl.handle.net/1959.13/1313968","pdf_url":null,"source":{"id":"https://openalex.org/S4306401391","display_name":"NOVA (University of Newcastle, Australia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I78757542","host_organization_name":"University of Newcastle Australia","host_organization_lineage":["https://openalex.org/I78757542"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"journal article"}],"best_oa_location":{"id":"doi:10.1186/s13029-015-0045-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13029-015-0045-3","pdf_url":"https://scfbm.biomedcentral.com/track/pdf/10.1186/s13029-015-0045-3","source":{"id":"https://openalex.org/S45786803","display_name":"Source Code for Biology and Medicine","issn_l":"1751-0473","issn":["1751-0473"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Source Code for Biology and Medicine","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.46000000834465027,"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320963","display_name":"University of Newcastle Australia","ror":"https://ror.org/00eae9z71"},{"id":"https://openalex.org/F4320320974","display_name":"University of Melbourne","ror":"https://ror.org/01ej9dk98"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2177237686.pdf","grobid_xml":"https://content.openalex.org/works/W2177237686.grobid-xml"},"referenced_works_count":9,"referenced_works":["https://openalex.org/W1560051613","https://openalex.org/W1566376227","https://openalex.org/W2000515602","https://openalex.org/W2062076898","https://openalex.org/W2113604695","https://openalex.org/W2133990480","https://openalex.org/W2146437022","https://openalex.org/W2163592640","https://openalex.org/W3104276456"],"related_works":["https://openalex.org/W2364420803","https://openalex.org/W25068511","https://openalex.org/W2362760518","https://openalex.org/W2368425793","https://openalex.org/W4253241429","https://openalex.org/W2370256962","https://openalex.org/W1492726150","https://openalex.org/W2362738498","https://openalex.org/W2382693809","https://openalex.org/W1997653423"],"abstract_inverted_index":{"BACKGROUND:":[0],"With":[1],"the":[2,62,83,128,197,203,214,251],"continued":[3],"exponential":[4],"growth":[5],"in":[6,71,139,179,265],"data":[7,10,209,259,278],"volume,":[8],"large-scale":[9,258],"mining":[11,260],"and":[12,41,51,90,117,130,170,193,206,228,232,244,284],"machine":[13,262],"learning":[14,263],"experiments":[15,97],"have":[16],"become":[17],"a":[18,35,55,88,99,114,136,142,159,176,191,236,282],"necessity":[19],"for":[20,31,141,241],"many":[21],"researchers":[22],"without":[23],"programming":[24],"or":[25,110,261],"statistics":[26],"backgrounds.":[27],"WEKA":[28,63,84,132,198],"(Waikato":[29],"Environment":[30],"Knowledge":[32],"Analysis)":[33],"is":[34,190,233],"gold":[36],"standard":[37],"framework":[38],"that":[39,68,144,210],"facilitates":[40],"simplifies":[42],"this":[43],"task":[44],"by":[45,167],"allowing":[46],"specification":[47,143],"of":[48,102,148,153,173,208,253,276],"algorithms,":[49],"hyper-parameters":[50],"test":[52],"strategies":[53],"from":[54,108],"streamlined":[56],"Experimenter":[57,64],"GUI.":[58],"Despite":[59],"its":[60],"popularity,":[61],"exhibits":[65],"several":[66],"limitations":[67,81],"we":[69],"address":[70],"our":[72],"new":[73],"FlexDM":[74,77,129,154,189,221],"software.":[75],"RESULTS:":[76],"addresses":[78],"four":[79],"fundamental":[80],"with":[82,270],"Experimenter:":[85],"reliance":[86],"on":[87,158,225],"verbose":[89],"difficult-to-modify":[91],"XML":[92,133,286],"schema;":[93],"inability":[94,105],"to":[95,106,119,196,267],"meta-optimise":[96],"over":[98,273],"large":[100,115,160],"number":[101],"algorithm":[103],"hyper-parameters;":[104],"recover":[107],"software":[109,247],"hardware":[111],"failure":[112],"during":[113,213],"experiment;":[116],"failing":[118],"leverage":[120],"modern":[121],"multicore":[122],"processor":[123,186],"architectures.":[124],"Direct":[125],"comparisons":[126],"between":[127],"default":[131],"schemas":[134],"demonstrate":[135],"10-fold":[137],"improvement":[138],"brevity":[140],"allows":[145],"finer":[146],"control":[147,272],"experimental":[149],"procedures.":[150],"The":[151],"stability":[152],"has":[155,211,222],"been":[156,223],"tested":[157,224],"biological":[161],"dataset":[162],"(approximately":[163],"450":[164],"k":[165],"attributes":[166],"150":[168],"samples),":[169],"automatic":[171],"parallelisation":[172],"tasks":[174],"yields":[175],"quasi-linear":[177],"reduction":[178],"execution":[180],"time":[181],"when":[182],"distributed":[183],"across":[184],"multiple":[185],"cores.":[187],"CONCLUSION:":[188],"powerful":[192],"easy-to-use":[194],"extension":[195],"package,":[199],"which":[200],"better":[201],"handles":[202],"increased":[204],"volume":[205],"complexity":[207],"emerged":[212],"20":[215],"years":[216],"since":[217],"WEKA's":[218],"original":[219],"development.":[220],"Windows,":[226],"OSX":[227],"Linux":[229],"operating":[230],"systems":[231],"provided":[234],"as":[235],"pre-configured":[237],"virtual":[238],"reference":[239],"environment":[240],"trivial":[242],"usage":[243],"extensibility.":[245],"This":[246],"can":[248],"substantially":[249],"improve":[250],"productivity":[252],"any":[254],"research":[255],"group":[256],"conducting":[257],"tasks,":[264],"addition":[266],"providing":[268],"non-programmers":[269],"improved":[271],"specific":[274],"aspects":[275],"their":[277],"analysis":[279],"pipeline":[280],"via":[281],"succinct":[283],"simplified":[285],"schema.":[287]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2026-04-29T09:16:38.111599","created_date":"2025-10-10T00:00:00"}
