{"id":"https://openalex.org/W4206952331","doi":"https://doi.org/10.1109/ssci50451.2021.9659937","title":"Distributed Ensemble Feature Selection Framework for High-Dimensional and High-Skewed Imbalanced Big Dataset","display_name":"Distributed Ensemble Feature Selection Framework for High-Dimensional and High-Skewed Imbalanced Big Dataset","publication_year":2021,"publication_date":"2021-12-05","ids":{"openalex":"https://openalex.org/W4206952331","doi":"https://doi.org/10.1109/ssci50451.2021.9659937"},"language":"en","primary_location":{"id":"doi:10.1109/ssci50451.2021.9659937","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ssci50451.2021.9659937","pdf_url":null,"source":{"id":"https://openalex.org/S4363604921","display_name":"2021 IEEE Symposium Series on Computational Intelligence (SSCI)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Symposium Series on Computational Intelligence (SSCI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://ris.utwente.nl/ws/files/278040097/10.1109_ssci50451.2021.9659937.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010857378","display_name":"Majid Soheili","orcid":"https://orcid.org/0000-0002-9689-6184"},"institutions":[{"id":"https://openalex.org/I110525433","display_name":"Islamic Azad University, Tehran","ror":"https://ror.org/01kzn7k21","country_code":"IR","type":"education","lineage":["https://openalex.org/I110525433"]}],"countries":["IR"],"is_corresponding":false,"raw_author_name":"Majid Soheili","raw_affiliation_strings":["Islamic Azad University, Neka, Iran"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Islamic Azad University, Neka, Iran","institution_ids":["https://openalex.org/I110525433"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054681389","display_name":"Maryam Amir Haeri","orcid":"https://orcid.org/0000-0002-9638-9481"},"institutions":[{"id":"https://openalex.org/I94624287","display_name":"University of Twente","ror":"https://ror.org/006hf6230","country_code":"NL","type":"education","lineage":["https://openalex.org/I94624287"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Maryam Amir Amir Haeri","raw_affiliation_strings":["University of Twente, Enschede, Netherlands"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Twente, Enschede, Netherlands","institution_ids":["https://openalex.org/I94624287"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2537,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.5349353,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9918000102043152,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13429","display_name":"Electricity Theft Detection Techniques","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.772253155708313},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.717939555644989},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6723438501358032},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5852060317993164},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5647971630096436},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5629962682723999},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5615895986557007},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.5576090812683105},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.5043588876724243},{"id":"https://openalex.org/keywords/ensemble-learning","display_name":"Ensemble learning","score":0.5012781620025635},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.41331297159194946},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.08076292276382446}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.772253155708313},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.717939555644989},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6723438501358032},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5852060317993164},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5647971630096436},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5629962682723999},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5615895986557007},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.5576090812683105},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.5043588876724243},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.5012781620025635},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.41331297159194946},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.08076292276382446},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/ssci50451.2021.9659937","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ssci50451.2021.9659937","pdf_url":null,"source":{"id":"https://openalex.org/S4363604921","display_name":"2021 IEEE Symposium Series on Computational Intelligence (SSCI)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE Symposium Series on Computational Intelligence (SSCI)","raw_type":"proceedings-article"},{"id":"pmh:oai:ris.utwente.nl:openaire/624d459f-6139-47ed-9f8f-468eca7c809c","is_oa":true,"landing_page_url":"https://research.utwente.nl/en/publications/624d459f-6139-47ed-9f8f-468eca7c809c","pdf_url":"https://ris.utwente.nl/ws/files/278040097/10.1109_ssci50451.2021.9659937.pdf","source":{"id":"https://openalex.org/S4406922991","display_name":"University of Twente Research Information","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Soheili, M & Haeri, M A 2022, Distributed Ensemble Feature Selection Framework for High-Dimensional and High-Skewed Imbalanced Big Dataset. in 2021 IEEE Symposium Series on Computational Intelligence, SSCI 2021 - Proceedings. 2021 IEEE Symposium Series on Computational Intelligence, SSCI 2021 - Proceedings, IEEE, 2021 IEEE Symposium Series on Computational Intelligence, SSCI 2021, Orlando, United States, 5/12/21. https://doi.org/10.1109/SSCI50451.2021.9659937","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:ris.utwente.nl:publications/624d459f-6139-47ed-9f8f-468eca7c809c","is_oa":true,"landing_page_url":"http://www.scopus.com/inward/record.url?scp=85125784570&partnerID=8YFLogxK","pdf_url":null,"source":{"id":"https://openalex.org/S4406922991","display_name":"University of Twente Research Information","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Soheili , M &amp; Haeri , M A 2022 , Distributed Ensemble Feature Selection Framework for High-Dimensional and High-Skewed Imbalanced Big Dataset . in 2021 IEEE Symposium Series on Computational Intelligence, SSCI 2021 - Proceedings . 2021 IEEE Symposium Series on Computational Intelligence, SSCI 2021 - Proceedings , IEEE , 2021 IEEE Symposium Series on Computational Intelligence, SSCI 2021 , Orlando , United States , 5/12/21 . https://doi.org/10.1109/SSCI50451.2021.9659937","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"pmh:oai:ris.utwente.nl:openaire/624d459f-6139-47ed-9f8f-468eca7c809c","is_oa":true,"landing_page_url":"https://research.utwente.nl/en/publications/624d459f-6139-47ed-9f8f-468eca7c809c","pdf_url":"https://ris.utwente.nl/ws/files/278040097/10.1109_ssci50451.2021.9659937.pdf","source":{"id":"https://openalex.org/S4406922991","display_name":"University of Twente Research Information","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Soheili, M & Haeri, M A 2022, Distributed Ensemble Feature Selection Framework for High-Dimensional and High-Skewed Imbalanced Big Dataset. in 2021 IEEE Symposium Series on Computational Intelligence, SSCI 2021 - Proceedings. 2021 IEEE Symposium Series on Computational Intelligence, SSCI 2021 - Proceedings, IEEE, 2021 IEEE Symposium Series on Computational Intelligence, SSCI 2021, Orlando, United States, 5/12/21. https://doi.org/10.1109/SSCI50451.2021.9659937","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4206952331.pdf","grobid_xml":"https://content.openalex.org/works/W4206952331.grobid-xml"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W212002884","https://openalex.org/W1429921896","https://openalex.org/W1808644423","https://openalex.org/W1968985250","https://openalex.org/W1975664724","https://openalex.org/W1989133258","https://openalex.org/W2052586313","https://openalex.org/W2119869458","https://openalex.org/W2171647935","https://openalex.org/W2408874603","https://openalex.org/W2475596014","https://openalex.org/W2524620548","https://openalex.org/W2537734429","https://openalex.org/W2611743072","https://openalex.org/W2727672833","https://openalex.org/W2752946155","https://openalex.org/W2755474412","https://openalex.org/W2785172785","https://openalex.org/W2899274556","https://openalex.org/W2910351322","https://openalex.org/W2948009788","https://openalex.org/W2995013516","https://openalex.org/W3083914941","https://openalex.org/W3101080475","https://openalex.org/W3105313435","https://openalex.org/W3121333339","https://openalex.org/W3133896312","https://openalex.org/W3160385040"],"related_works":["https://openalex.org/W4390608645","https://openalex.org/W4247566972","https://openalex.org/W4394895745","https://openalex.org/W2960264696","https://openalex.org/W3090563135","https://openalex.org/W2497432351","https://openalex.org/W4206777497","https://openalex.org/W2910064364","https://openalex.org/W4200136508","https://openalex.org/W2499527417"],"abstract_inverted_index":{"The":[0,146,222],"class-imbalance":[1],"problem":[2],"emerges":[3],"when":[4],"the":[5,18,27,34,64,67,77,91,95,115,124,227],"class":[6],"labels":[7],"of":[8,66,74,123],"a":[9,12,72,131,158,164,169,183,219],"dataset":[10],"have":[11,234],"skewed":[13],"distribution.":[14],"In":[15,40,186],"this":[16,187],"circumstance,":[17],"instances":[19,35],"belonging":[20,36],"to":[21,37,62,84,109,140,154],"one":[22,96],"class,":[23],"which":[24,106],"is":[25,107,119],"exactly":[26],"principal":[28],"purpose,":[29],"are":[30,103,197,207,210,230],"dominated":[31],"thoroughly":[32],"by":[33],"other":[38,116],"classes.":[39],"recent":[41],"years,":[42],"feature":[43,60,75,78,100,135,165,180,191],"selection":[44,101,136],"for":[45],"high-dimensional":[46],"imbalanced":[47,144,215],"data":[48,152],"has":[49,81],"become":[50],"attraction":[51],"research":[52],"scope.":[53],"This":[54,128],"technique":[55,80],"concerns":[56],"selecting":[57],"an":[58,120],"informative":[59],"set":[61],"improve":[63],"accuracy":[65],"classification":[68,245],"model.":[69],"Moreover,":[70],"as":[71],"subcategory":[73],"selection,":[76],"ranking":[79,166,192],"been":[82],"deliberated":[83],"cope":[85,110],"with":[86,111,142],"high":[87],"-dimensional":[88],"datasets":[89,216],"in":[90,157,168,182],"last":[92],"decade.":[93],"On":[94,114],"hand,":[97,117],"most":[98],"traditional":[99,190],"methods":[102,203,229],"not":[104],"scalable,":[105],"critical":[108],"large-scale":[112],"datasets.":[113,145],"scalability":[118],"intrinsic":[121],"characteristic":[122],"ensemble":[125],"learning":[126],"approach.":[127],"paper":[129],"proposes":[130],"Distributed":[132],"Ensemble":[133],"Imbalanced":[134],"framework,":[137],"called":[138],"DEIM,":[139,147],"deal":[141],"big":[143,214],"at":[148],"first,":[149],"transforms":[150],"default":[151],"partitions":[153,156],"representative":[155],"single":[159],"pass.":[160],"Second,":[161],"it":[162],"applies":[163],"method":[167],"bagging":[170],"approach":[171],"upon":[172,218],"each":[173],"partition":[174],"independently.":[175],"Finally,":[176],"It":[177],"fuses":[178],"intermediate":[179],"rankings":[181],"stacking":[184],"strategy.":[185],"paper,":[188],"two":[189,202],"algorithms,":[193],"ReliefF":[194],"and":[195,205,217,238,249],"QPFS,":[196],"plugged":[198],"into":[199],"DEIM.":[200],"Therefore,":[201],"DEIM-Relief":[204],"DEIM-QPFS,":[206],"produced.":[208],"Experiments":[209],"accomplished":[211],"on":[212],"three":[213],"computer":[220],"cluster.":[221],"empirical":[223],"study":[224],"depicts":[225],"that":[226],"produced":[228],"scalable.":[231],"Also,":[232],"they":[233],"lower":[235],"execution":[236],"times,":[237],"their":[239],"final":[240],"results":[241],"can":[242],"induce":[243],"better":[244],"models":[246],"than":[247],"DiReliefF":[248],"DQPFS.":[250]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
