{"id":"https://openalex.org/W3145855438","doi":"https://doi.org/10.31577/cai_2020_5_881","title":"Optimal Feature Subset Selection Based on Combining Document Frequency and Term Frequency for Text Classification","display_name":"Optimal Feature Subset Selection Based on Combining Document Frequency and Term Frequency for Text Classification","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3145855438","doi":"https://doi.org/10.31577/cai_2020_5_881","mag":"3145855438"},"language":"en","primary_location":{"id":"doi:10.31577/cai_2020_5_881","is_oa":true,"landing_page_url":"https://doi.org/10.31577/cai_2020_5_881","pdf_url":"http://www.cai.sk/ojs/index.php/cai/article/download/2020_5_881/1052","source":{"id":"https://openalex.org/S4210200093","display_name":"Computing and Informatics","issn_l":"1335-9150","issn":["1335-9150","2585-8807"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computing and Informatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"http://www.cai.sk/ojs/index.php/cai/article/download/2020_5_881/1052","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086210026","display_name":"K Thirumoorthy","orcid":"https://orcid.org/0000-0001-8107-5183"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Thirumoorthy Karpagalingam","raw_affiliation_strings":["Department of Computer Science and Engineering, Mepco Schlenk Engineering College, Sivakasi, Tamilnadu, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Mepco Schlenk Engineering College, Sivakasi, Tamilnadu, India","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029382525","display_name":"Muneeswaran Karuppaiah","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muneeswaran Karuppaiah","raw_affiliation_strings":["Department of Computer Science and Engineering, Mepco Schlenk Engineering College, Sivakasi, Tamilnadu, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Mepco Schlenk Engineering College, Sivakasi, Tamilnadu, India","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5086210026"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2718,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.6714769,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"39","issue":"5","first_page":"881","last_page":"906"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9627000093460083,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9627000093460083,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.7759464979171753},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.7241520881652832},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6612460017204285},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.653388500213623},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.621875524520874},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5984602570533752},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.5403793454170227},{"id":"https://openalex.org/keywords/dimensionality-reduction","display_name":"Dimensionality reduction","score":0.5397196412086487},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.48105955123901367},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.46317583322525024},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4569575786590576},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.44633233547210693},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.441936194896698},{"id":"https://openalex.org/keywords/linear-classifier","display_name":"Linear classifier","score":0.41098320484161377},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.41080614924430847},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.36782586574554443},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.13177627325057983}],"concepts":[{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.7759464979171753},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.7241520881652832},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6612460017204285},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.653388500213623},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.621875524520874},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5984602570533752},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.5403793454170227},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.5397196412086487},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.48105955123901367},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.46317583322525024},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4569575786590576},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.44633233547210693},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.441936194896698},{"id":"https://openalex.org/C139532973","wikidata":"https://www.wikidata.org/wiki/Q2679259","display_name":"Linear classifier","level":3,"score":0.41098320484161377},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.41080614924430847},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36782586574554443},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.13177627325057983},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.31577/cai_2020_5_881","is_oa":true,"landing_page_url":"https://doi.org/10.31577/cai_2020_5_881","pdf_url":"http://www.cai.sk/ojs/index.php/cai/article/download/2020_5_881/1052","source":{"id":"https://openalex.org/S4210200093","display_name":"Computing and Informatics","issn_l":"1335-9150","issn":["1335-9150","2585-8807"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computing and Informatics","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.31577/cai_2020_5_881","is_oa":true,"landing_page_url":"https://doi.org/10.31577/cai_2020_5_881","pdf_url":"http://www.cai.sk/ojs/index.php/cai/article/download/2020_5_881/1052","source":{"id":"https://openalex.org/S4210200093","display_name":"Computing and Informatics","issn_l":"1335-9150","issn":["1335-9150","2585-8807"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computing and Informatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320323425","display_name":"Anna University","ror":"https://ror.org/01qhf1r47"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3145855438.pdf","grobid_xml":"https://content.openalex.org/works/W3145855438.grobid-xml"},"referenced_works_count":44,"referenced_works":["https://openalex.org/W140742851","https://openalex.org/W251061919","https://openalex.org/W1590729858","https://openalex.org/W1826790618","https://openalex.org/W1982589161","https://openalex.org/W1986190044","https://openalex.org/W1987504723","https://openalex.org/W1993539890","https://openalex.org/W1999635750","https://openalex.org/W2008794359","https://openalex.org/W2017337590","https://openalex.org/W2020355555","https://openalex.org/W2032793012","https://openalex.org/W2044127635","https://openalex.org/W2047328133","https://openalex.org/W2087327261","https://openalex.org/W2090874595","https://openalex.org/W2093452304","https://openalex.org/W2103333826","https://openalex.org/W2110848057","https://openalex.org/W2118020653","https://openalex.org/W2118965172","https://openalex.org/W2134090438","https://openalex.org/W2135813353","https://openalex.org/W2140321362","https://openalex.org/W2149684865","https://openalex.org/W2150747245","https://openalex.org/W2150827944","https://openalex.org/W2169384781","https://openalex.org/W2170397402","https://openalex.org/W2172000360","https://openalex.org/W2207631730","https://openalex.org/W2340455672","https://openalex.org/W2476011396","https://openalex.org/W2566823011","https://openalex.org/W2792328264","https://openalex.org/W2949836779","https://openalex.org/W2998216295","https://openalex.org/W3048037280","https://openalex.org/W4213009331","https://openalex.org/W4235113149","https://openalex.org/W4236122429","https://openalex.org/W4299726690","https://openalex.org/W4376534080"],"related_works":["https://openalex.org/W20047544","https://openalex.org/W1503496037","https://openalex.org/W2021546954","https://openalex.org/W2249970211","https://openalex.org/W2055840562","https://openalex.org/W2028016548","https://openalex.org/W8815205","https://openalex.org/W2150954665","https://openalex.org/W1597543867","https://openalex.org/W3023727762"],"abstract_inverted_index":{"Feature":[0],"selection":[1,73,140],"plays":[2],"a":[3,42,70,92,131],"vital":[4],"role":[5],"to":[6,55,87],"reduce":[7],"the":[8,12,16,28,33,39,46,50,57,77,81,89,127],"high":[9],"dimension":[10,22],"of":[11,24,41,45,49,91],"feature":[13,25,72,96,139],"space":[14,26],"in":[15,59],"text":[17,34,51,119],"document":[18,78],"classification":[19,35,133],"problem.":[20],"The":[21,94,122],"reduction":[23],"reduces":[27],"computation":[29],"cost":[30],"and":[31,80,110],"improves":[32],"system":[36],"accuracy.":[37,65],"Hence,":[38],"identification":[40],"proper":[43],"subset":[44,97],"significant":[47],"features":[48],"corpus":[52,120],"is":[53,85,99,105],"needed":[54],"classify":[56],"data":[58],"less":[60],"computational":[61],"time":[62],"with":[63,115,137],"higher":[64],"In":[66],"this":[67],"proposed":[68,103,128],"research,":[69],"novel":[71],"method":[74,129],"which":[75,98],"combines":[76],"frequency":[79,83],"term":[82],"(FS-DFTF)":[84],"used":[86],"measure":[88],"significance":[90],"term.":[93],"optimal":[95],"selected":[100],"by":[101],"our":[102],"work":[104],"evaluated":[106],"using":[107],"Naive":[108],"Bayes":[109],"Support":[111],"Vector":[112],"Machine":[113],"classifier":[114],"various":[116],"popular":[117],"benchmark":[118],"datasets.":[121],"experimental":[123],"outcome":[124],"confirms":[125],"that":[126],"has":[130],"better":[132],"accuracy":[134],"when":[135],"compared":[136],"other":[138],"techniques.":[141]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":2}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
