{"id":"https://openalex.org/W2927733588","doi":"https://doi.org/10.1186/s40537-019-0186-3","title":"Selecting a representative decision tree from an ensemble of decision-tree models for fast big data classification","display_name":"Selecting a representative decision tree from an ensemble of decision-tree models for fast big data classification","publication_year":2019,"publication_date":"2019-02-28","ids":{"openalex":"https://openalex.org/W2927733588","doi":"https://doi.org/10.1186/s40537-019-0186-3","mag":"2927733588"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-019-0186-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-019-0186-3","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-019-0186-3","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-019-0186-3","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037956466","display_name":"Abraham Itzhak Weinberg","orcid":"https://orcid.org/0000-0002-2505-9653"},"institutions":[{"id":"https://openalex.org/I124227911","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982","country_code":"IL","type":"education","lineage":["https://openalex.org/I124227911"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Abraham Itzhak Weinberg","raw_affiliation_strings":["Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, BeerSheba, Israel"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, BeerSheba, Israel","institution_ids":["https://openalex.org/I124227911"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066910344","display_name":"Mark Last","orcid":"https://orcid.org/0000-0003-0748-7918"},"institutions":[{"id":"https://openalex.org/I124227911","display_name":"Ben-Gurion University of the Negev","ror":"https://ror.org/05tkyf982","country_code":"IL","type":"education","lineage":["https://openalex.org/I124227911"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Mark Last","raw_affiliation_strings":["Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, BeerSheba, Israel"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Software and Information Systems Engineering, Ben-Gurion University of the Negev, BeerSheba, Israel","institution_ids":["https://openalex.org/I124227911"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5037956466"],"corresponding_institution_ids":["https://openalex.org/I124227911"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":3.4843,"has_fulltext":true,"cited_by_count":49,"citation_normalized_percentile":{"value":0.94120352,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"6","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/c4.5-algorithm","display_name":"C4.5 algorithm","score":0.7776401042938232},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7494809627532959},{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.6707097887992859},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6070290803909302},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5431131720542908},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5176059007644653},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.510218620300293},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.49318093061447144},{"id":"https://openalex.org/keywords/ensemble-learning","display_name":"Ensemble learning","score":0.47078365087509155},{"id":"https://openalex.org/keywords/majority-rule","display_name":"Majority rule","score":0.46341246366500854},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.44996023178100586},{"id":"https://openalex.org/keywords/ensemble-forecasting","display_name":"Ensemble forecasting","score":0.42984092235565186},{"id":"https://openalex.org/keywords/decision-tree-model","display_name":"Decision tree model","score":0.41331204771995544},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32820576429367065},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.2623484134674072},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.20706823468208313},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.13001245260238647}],"concepts":[{"id":"https://openalex.org/C52003472","wikidata":"https://www.wikidata.org/wiki/Q1022655","display_name":"C4.5 algorithm","level":4,"score":0.7776401042938232},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7494809627532959},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.6707097887992859},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6070290803909302},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5431131720542908},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5176059007644653},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.510218620300293},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.49318093061447144},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.47078365087509155},{"id":"https://openalex.org/C153668964","wikidata":"https://www.wikidata.org/wiki/Q27636","display_name":"Majority rule","level":2,"score":0.46341246366500854},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.44996023178100586},{"id":"https://openalex.org/C119898033","wikidata":"https://www.wikidata.org/wiki/Q3433888","display_name":"Ensemble forecasting","level":2,"score":0.42984092235565186},{"id":"https://openalex.org/C56289965","wikidata":"https://www.wikidata.org/wiki/Q5249246","display_name":"Decision tree model","level":3,"score":0.41331204771995544},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32820576429367065},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.2623484134674072},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20706823468208313},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.13001245260238647},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s40537-019-0186-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-019-0186-3","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-019-0186-3","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:b45835779e044e8b959e5969b52be442","is_oa":true,"landing_page_url":"https://doaj.org/article/b45835779e044e8b959e5969b52be442","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Big Data, Vol 6, Iss 1, Pp 1-17 (2019)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-019-0186-3","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-019-0186-3","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-019-0186-3","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.800000011920929}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2927733588.pdf","grobid_xml":"https://content.openalex.org/works/W2927733588.grobid-xml"},"referenced_works_count":41,"referenced_works":["https://openalex.org/W216882981","https://openalex.org/W866281365","https://openalex.org/W1483135265","https://openalex.org/W1489069776","https://openalex.org/W1562463424","https://openalex.org/W1575085314","https://openalex.org/W1576962511","https://openalex.org/W1581797854","https://openalex.org/W1588100052","https://openalex.org/W1598873931","https://openalex.org/W1959511748","https://openalex.org/W1976373002","https://openalex.org/W1981276685","https://openalex.org/W1981325283","https://openalex.org/W1991137221","https://openalex.org/W2002579649","https://openalex.org/W2003889154","https://openalex.org/W2009537245","https://openalex.org/W2033139852","https://openalex.org/W2048231652","https://openalex.org/W2068714596","https://openalex.org/W2072755970","https://openalex.org/W2074726512","https://openalex.org/W2075877598","https://openalex.org/W2087295784","https://openalex.org/W2091801169","https://openalex.org/W2105175890","https://openalex.org/W2125816831","https://openalex.org/W2128073546","https://openalex.org/W2129288417","https://openalex.org/W2131851440","https://openalex.org/W2135293965","https://openalex.org/W2141083048","https://openalex.org/W2152837238","https://openalex.org/W2691984185","https://openalex.org/W2782681843","https://openalex.org/W2809089185","https://openalex.org/W2911964244","https://openalex.org/W3106409770","https://openalex.org/W4244174440","https://openalex.org/W6630437497"],"related_works":["https://openalex.org/W4386883672","https://openalex.org/W2794896638","https://openalex.org/W1807784185","https://openalex.org/W3110815158","https://openalex.org/W3202800081","https://openalex.org/W1909207154","https://openalex.org/W3124390867","https://openalex.org/W2416142762","https://openalex.org/W3101614107","https://openalex.org/W2979309038"],"abstract_inverted_index":{"The":[0,56,129,187],"goal":[1],"of":[2,12,22,24,52,74,94,98,156,190,221],"this":[3,79],"paper":[4],"is":[5,43,59,195],"to":[6,46,83,91,124,161,236],"reduce":[7],"the":[8,30,36,40,49,53,75,92,99,112,115,121,166,181,184,208,218,222,228,231,239,244],"classification":[9,254],"(inference)":[10],"complexity":[11],"tree":[13,80,108,113],"ensembles":[14],"by":[15,225,243],"choosing":[16,96,111],"a":[17,66,68,71,84,175,248],"single":[18],"representative":[19,51,127,240],"model":[20],"out":[21],"ensemble":[23,37,86,123,237],"multiple":[25],"decision-tree":[26,142],"models.":[27,101],"We":[28,77],"compute":[29],"similarity":[31,64,168],"between":[32,217],"different":[33,63,154],"models":[34,241],"in":[35],"and":[38,70,90,119,145,147,183,201,227,260],"choose":[39],"model,":[41],"which":[42],"most":[44,126,164],"similar":[45],"others":[47],"as":[48],"best":[50],"entire":[54],"dataset.":[55],"similarity-based":[57],"approach":[58],"implemented":[60],"with":[61,256],"three":[62],"metrics:":[65],"syntactic,":[67],"semantic,":[69],"linear":[72],"combination":[73],"two.":[76],"compare":[78],"selection":[81,109],"methodology":[82],"popular":[85,141],"algorithm":[87],"(majority":[88],"voting)":[89],"baseline":[93],"randomly":[95],"one":[97],"local":[100],"In":[102,163],"addition,":[103],"we":[104,211],"evaluate":[105],"two":[106,140],"alternative":[107],"strategies:":[110],"having":[114,230],"highest":[116,232],"validation":[117,233],"accuracy":[118,179,189,220],"reducing":[120],"original":[122],"five":[125],"trees.":[128],"comparative":[130],"evaluation":[131],"experiments":[132],"are":[133],"performed":[134],"on":[135],"six":[136,153],"big":[137,252],"datasets":[138,194],"using":[139],"algorithms":[143],"(J48":[144],"CART)":[146],"splitting":[148],"each":[149],"dataset":[150],"horizontally":[151],"into":[152],"amounts":[155],"equal-size":[157],"slices":[158],"(from":[159],"32":[160],"1024).":[162],"experiments,":[165],"syntactic":[167],"approach,":[169],"named":[170],"SySM\u2014Syntactic":[171],"Similarity":[172],"Method,":[173],"provides":[174],"significantly":[176],"higher":[177,249],"testing":[178,219],"than":[180],"semantic":[182],"combined":[185],"ones.":[186],"mean":[188],"SySM":[191,226],"over":[192],"all":[193],"$${0.835}":[196],"\\pm":[197,203],"{0.065}$$":[198],"for":[199,205,251],"CART":[200],"$${0.769}":[202],"{0.066}$$":[204],"J48.":[206],"On":[207],"other":[209],"hand,":[210],"find":[212],"no":[213],"statistically":[214],"significant":[215],"difference":[216],"trees":[223,229],"selected":[224,242],"accuracy.":[234],"Comparing":[235],"algorithms,":[238],"proposed":[245],"methods":[246],"provide":[247],"speed":[250],"data":[253],"along":[255],"being":[257],"more":[258],"compact":[259],"interpretable.":[261]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":4}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
