{"id":"https://openalex.org/W3212951169","doi":"https://doi.org/10.1109/icccnt51525.2021.9580029","title":"Multiclass Imbalanced Big Data Classification Utilizing Spark Cluster","display_name":"Multiclass Imbalanced Big Data Classification Utilizing Spark Cluster","publication_year":2021,"publication_date":"2021-07-06","ids":{"openalex":"https://openalex.org/W3212951169","doi":"https://doi.org/10.1109/icccnt51525.2021.9580029","mag":"3212951169"},"language":"en","primary_location":{"id":"doi:10.1109/icccnt51525.2021.9580029","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icccnt51525.2021.9580029","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 12th International Conference on Computing Communication and Networking Technologies (ICCCNT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023975871","display_name":"Tinku Singh","orcid":"https://orcid.org/0000-0002-9146-8682"},"institutions":[{"id":"https://openalex.org/I26072440","display_name":"Indian Institute of Information Technology Allahabad","ror":"https://ror.org/03rgjt374","country_code":"IN","type":"education","lineage":["https://openalex.org/I26072440"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Tinku Singh","raw_affiliation_strings":["Indian Institute of Information Technology Allahabad,Department of IT,Prayagraj,India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Information Technology Allahabad,Department of IT,Prayagraj,India","institution_ids":["https://openalex.org/I26072440"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023761552","display_name":"Riya Khanna","orcid":null},"institutions":[{"id":"https://openalex.org/I26072440","display_name":"Indian Institute of Information Technology Allahabad","ror":"https://ror.org/03rgjt374","country_code":"IN","type":"education","lineage":["https://openalex.org/I26072440"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Riya Khanna","raw_affiliation_strings":["Indian Institute of Information Technology Allahabad,Department of IT,Prayagraj,India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Information Technology Allahabad,Department of IT,Prayagraj,India","institution_ids":["https://openalex.org/I26072440"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083905410","display_name":"Satakshi","orcid":null},"institutions":[{"id":"https://openalex.org/I168893459","display_name":"University of Allahabad","ror":"https://ror.org/03vrx7m55","country_code":"IN","type":"education","lineage":["https://openalex.org/I168893459"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Satakshi","raw_affiliation_strings":["SHAUTS Allahabad,Department of Maths,U.P.,India"],"affiliations":[{"raw_affiliation_string":"SHAUTS Allahabad,Department of Maths,U.P.,India","institution_ids":["https://openalex.org/I168893459"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018728658","display_name":"Manish Kumar","orcid":"https://orcid.org/0000-0002-1311-0976"},"institutions":[{"id":"https://openalex.org/I26072440","display_name":"Indian Institute of Information Technology Allahabad","ror":"https://ror.org/03rgjt374","country_code":"IN","type":"education","lineage":["https://openalex.org/I26072440"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Manish Kumar","raw_affiliation_strings":["Indian Institute of Information Technology Allahabad,Department of IT,Prayagraj,India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Information Technology Allahabad,Department of IT,Prayagraj,India","institution_ids":["https://openalex.org/I26072440"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5023975871"],"corresponding_institution_ids":["https://openalex.org/I26072440"],"apc_list":null,"apc_paid":null,"fwci":0.6798,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.76320286,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13429","display_name":"Electricity Theft Detection Techniques","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.8239604234695435},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7933565378189087},{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.7869086265563965},{"id":"https://openalex.org/keywords/undersampling","display_name":"Undersampling","score":0.6514731049537659},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.6039391160011292},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5659236311912537},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.5532337427139282},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.505160391330719},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4876185953617096},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.4786463975906372},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.4707986116409302},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4468452036380768},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4262917637825012},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.41862404346466064},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3515401780605316}],"concepts":[{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.8239604234695435},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7933565378189087},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.7869086265563965},{"id":"https://openalex.org/C136536468","wikidata":"https://www.wikidata.org/wiki/Q1225894","display_name":"Undersampling","level":2,"score":0.6514731049537659},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.6039391160011292},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5659236311912537},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.5532337427139282},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.505160391330719},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4876185953617096},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.4786463975906372},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.4707986116409302},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4468452036380768},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4262917637825012},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.41862404346466064},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3515401780605316},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icccnt51525.2021.9580029","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icccnt51525.2021.9580029","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 12th International Conference on Computing Communication and Networking Technologies (ICCCNT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Life in Land","score":0.6399999856948853,"id":"https://metadata.un.org/sdg/15"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1930624869","https://openalex.org/W1984323748","https://openalex.org/W2015627422","https://openalex.org/W2095178814","https://openalex.org/W2120240539","https://openalex.org/W2125283600","https://openalex.org/W2135074661","https://openalex.org/W2171647935","https://openalex.org/W2557427388","https://openalex.org/W2597837117","https://openalex.org/W2730240860","https://openalex.org/W2773612851","https://openalex.org/W2780278454","https://openalex.org/W2887451702","https://openalex.org/W2887974490","https://openalex.org/W2911964244","https://openalex.org/W2982160266","https://openalex.org/W3094843711","https://openalex.org/W6640462745"],"related_works":["https://openalex.org/W2545366524","https://openalex.org/W3211874991","https://openalex.org/W2737538696","https://openalex.org/W3176807344","https://openalex.org/W3215678666","https://openalex.org/W4291692947","https://openalex.org/W997111777","https://openalex.org/W4281783369","https://openalex.org/W4231725381","https://openalex.org/W4384300587"],"abstract_inverted_index":{"Because":[0,58],"of":[1,24,28,35,55,59,67,78,128,160,187],"the":[2,22,36,45,60,65,91,126,141,158,161,175],"massive":[3,170],"increase":[4],"in":[5,13,52,81,135,140,157],"data":[6,17,72,83,116,143],"collection":[7],"and":[8,44,114,131],"storage":[9],"that":[10,38],"has":[11,145],"occurred":[12],"recent":[14],"years,":[15],"big":[16,71,123,142],"applications":[18],"are":[19,94],"increasingly":[20],"becoming":[21],"focus":[23],"attention.":[25],"The":[26,165],"difficulty":[27],"classification":[29],"with":[30,121,137,182],"imbalanced":[31,122,138],"datasets":[32,139,171],"is":[33,73,90],"one":[34,87],"complexities":[37],"make":[39],"extracting":[40],"meaningful":[41],"information":[42],"difficult,":[43],"key":[46],"impact":[47],"arises":[48],"from":[49,86,100],"its":[50],"existence":[51],"a":[53,183],"variety":[54,61],"real-world":[56,82],"applications.":[57],"as":[62,64],"well":[63],"veracity":[66],"such":[68],"obtained":[69],"data,":[70],"impacted":[74],"by":[75,98],"an":[76,109],"imbalance":[77],"classes.":[79,102],"Furthermore,":[80,125],"applications,":[84],"samples":[85,99],"class,":[88],"which":[89],"core":[92],"concern,":[93],"frequently":[95],"vastly":[96],"dominated":[97],"other":[101],"In":[103],"this":[104],"study,":[105],"we":[106],"have":[107,150],"proposed":[108,166],"approach":[110],"using":[111],"block-level":[112],"undersampling":[113],"synthetic":[115],"point":[117],"generation":[118],"to":[119,178],"deal":[120],"data.":[124],"performance":[127],"Random":[129],"Forest":[130],"Decision":[132],"Tree":[133],"algorithms":[134],"dealing":[136],"context":[144],"been":[146,151],"evaluated.":[147],"Extensive":[148],"experiments":[149],"performed":[152],"utilizing":[153],"Apache":[154],"Spark":[155],"Cluster":[156],"development":[159],"different":[162],"discussion":[163],"methods.":[164],"technique":[167],"can":[168],"handle":[169],"while":[172],"still":[173],"offering":[174],"assistance":[176],"required":[177],"accurately":[179],"categories":[180],"classes":[181],"comparatively":[184],"less":[185],"number":[186],"instances.":[188]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2025-10-10T00:00:00"}
