{"id":"https://openalex.org/W2585605463","doi":"https://doi.org/10.1109/bigdata.2016.7840725","title":"Embedding feature selection for large-scale hierarchical classification","display_name":"Embedding feature selection for large-scale hierarchical classification","publication_year":2016,"publication_date":"2016-12-01","ids":{"openalex":"https://openalex.org/W2585605463","doi":"https://doi.org/10.1109/bigdata.2016.7840725","mag":"2585605463"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2016.7840725","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2016.7840725","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1706.01581","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085325081","display_name":"Azad Naik","orcid":"https://orcid.org/0000-0002-9151-6154"},"institutions":[{"id":"https://openalex.org/I162714631","display_name":"George Mason University","ror":"https://ror.org/02jqj7156","country_code":"US","type":"education","lineage":["https://openalex.org/I162714631"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Azad Naik","raw_affiliation_strings":["Department of Computer Science, George Mason University, Fairfax, VA, United States"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, George Mason University, Fairfax, VA, United States","institution_ids":["https://openalex.org/I162714631"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006581225","display_name":"Huzefa Rangwala","orcid":"https://orcid.org/0000-0003-0435-0035"},"institutions":[{"id":"https://openalex.org/I162714631","display_name":"George Mason University","ror":"https://ror.org/02jqj7156","country_code":"US","type":"education","lineage":["https://openalex.org/I162714631"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Huzefa Rangwala","raw_affiliation_strings":["Department of Computer Science, George Mason University, Fairfax, VA, United States"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, George Mason University, Fairfax, VA, United States","institution_ids":["https://openalex.org/I162714631"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5085325081"],"corresponding_institution_ids":["https://openalex.org/I162714631"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.17182199,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1212","last_page":"1221"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9750000238418579,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.9750000238418579,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9743000268936157,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9524999856948853,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.7354937791824341},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7180554866790771},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6226789355278015},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6035076975822449},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5981705188751221},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5715473294258118},{"id":"https://openalex.org/keywords/dimensionality-reduction","display_name":"Dimensionality reduction","score":0.5686109066009521},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5518273115158081},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5292800068855286},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5202535390853882},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.5090134143829346},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.4944190979003906},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4735504686832428},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4632958173751831},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4197629392147064},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.0800473690032959}],"concepts":[{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.7354937791824341},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7180554866790771},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6226789355278015},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6035076975822449},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5981705188751221},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5715473294258118},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.5686109066009521},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5518273115158081},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5292800068855286},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5202535390853882},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.5090134143829346},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.4944190979003906},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4735504686832428},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4632958173751831},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4197629392147064},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0800473690032959},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/bigdata.2016.7840725","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2016.7840725","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1706.01581","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1706.01581","pdf_url":"https://arxiv.org/pdf/1706.01581","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2585605463","is_oa":true,"landing_page_url":"http://export.arxiv.org/pdf/1706.01581","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1706.01581","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1706.01581","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1706.01581","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1706.01581","pdf_url":"https://arxiv.org/pdf/1706.01581","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.7200000286102295}],"awards":[{"id":"https://openalex.org/G2186650571","display_name":null,"funder_award_id":"1252318","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G2684336614","display_name":null,"funder_award_id":"1447489","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6894402473","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320309029","display_name":"George Mason University","ror":"https://ror.org/02jqj7156"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2585605463.pdf","grobid_xml":"https://content.openalex.org/works/W2585605463.grobid-xml"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W229800277","https://openalex.org/W1999635750","https://openalex.org/W2005422315","https://openalex.org/W2014566476","https://openalex.org/W2017337590","https://openalex.org/W2023450550","https://openalex.org/W2025047573","https://openalex.org/W2036609757","https://openalex.org/W2063862666","https://openalex.org/W2091669653","https://openalex.org/W2103017472","https://openalex.org/W2111979819","https://openalex.org/W2114535528","https://openalex.org/W2123096872","https://openalex.org/W2131987814","https://openalex.org/W2133462743","https://openalex.org/W2137165876","https://openalex.org/W2150766729","https://openalex.org/W2154053567","https://openalex.org/W2160794449","https://openalex.org/W2168540192","https://openalex.org/W2168606214","https://openalex.org/W2183238986","https://openalex.org/W2963950136","https://openalex.org/W6601706988","https://openalex.org/W6636378376","https://openalex.org/W6639512213","https://openalex.org/W6675138327","https://openalex.org/W6676297131","https://openalex.org/W6680890615","https://openalex.org/W6682304300","https://openalex.org/W6684268674","https://openalex.org/W6758972637"],"related_works":["https://openalex.org/W3037855598","https://openalex.org/W2463985427","https://openalex.org/W2552654392","https://openalex.org/W2594138535","https://openalex.org/W2897768208","https://openalex.org/W2051868889","https://openalex.org/W3210485692","https://openalex.org/W2034562453","https://openalex.org/W267869499","https://openalex.org/W2295985801","https://openalex.org/W2389765312","https://openalex.org/W2792553064","https://openalex.org/W2588792172","https://openalex.org/W2978358790","https://openalex.org/W2993501139","https://openalex.org/W201025399","https://openalex.org/W3212062851","https://openalex.org/W2561308513","https://openalex.org/W1141488758","https://openalex.org/W3023624315"],"abstract_inverted_index":{"Large-scale":[0],"Hierarchical":[1],"Classification":[2],"(HC)":[3],"involves":[4],"datasets":[5,119,136],"consisting":[6],"of":[7,9,13,32,65,71,123,132,148],"thousands":[8],"classes":[10,125],"and":[11,55,82,117,126,137],"millions":[12],"training":[14,49],"instances":[15,127],"with":[16,41,120],"high-dimensional":[17],"features":[18,34],"posing":[19],"several":[20],"big":[21],"data":[22],"challenges.":[23],"Feature":[24],"selection":[25,78,101],"that":[26],"aims":[27],"to":[28,39,79,106],"select":[29],"the":[30,48,52,57,62,72,86,108,145,160],"subset":[31],"discriminant":[33],"is":[35],"an":[36],"effective":[37],"strategy":[38],"deal":[40],"large-scale":[42,109],"HC":[43,110],"problem.":[44,111],"It":[45],"speeds":[46],"up":[47],"process,":[50],"reduces":[51],"prediction":[53],"time":[54],"minimizes":[56],"memory":[58,141],"requirements":[59,142],"by":[60,89],"compressing":[61],"total":[63],"size":[64],"learned":[66,149],"model":[67,150],"weight":[68,146],"vectors.":[69],"Majority":[70],"studies":[73],"have":[74],"also":[75],"shown":[76],"feature":[77,100],"be":[80],"competent":[81],"successful":[83],"in":[84,159],"improving":[85],"classification":[87,161],"accuracy":[88],"removing":[90],"irrelevant":[91],"features.":[92],"In":[93],"this":[94],"work,":[95],"we":[96],"investigate":[97],"various":[98],"filter-based":[99],"methods":[102],"for":[103,143,156],"dimensionality":[104],"reduction":[105],"solve":[107],"Our":[112],"experimental":[113],"evaluation":[114],"on":[115,134],"text":[116],"image":[118],"varying":[121],"distribution":[122],"features,":[124],"shows":[128],"upto":[129,138],"3x":[130],"order":[131],"speed-up":[133],"massive":[135],"45%":[139],"less":[140],"storing":[144],"vectors":[147],"without":[151],"any":[152],"significant":[153],"loss":[154],"(improvement":[155],"some":[157],"datasets)":[158],"accuracy.":[162],"Source":[163],"Code:":[164],"https://cs.gmu.edu/~mlbio/featureselection.":[165]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
