{"id":"https://openalex.org/W1995766244","doi":"https://doi.org/10.1109/fskd.2014.6980902","title":"New feature selection methods based on context similarity for text categorization","display_name":"New feature selection methods based on context similarity for text categorization","publication_year":2014,"publication_date":"2014-08-01","ids":{"openalex":"https://openalex.org/W1995766244","doi":"https://doi.org/10.1109/fskd.2014.6980902","mag":"1995766244"},"language":"en","primary_location":{"id":"doi:10.1109/fskd.2014.6980902","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fskd.2014.6980902","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 11th International Conference on Fuzzy Systems and Knowledge Discovery (FSKD)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100606731","display_name":"Yifei Chen","orcid":"https://orcid.org/0009-0001-9475-0480"},"institutions":[{"id":"https://openalex.org/I206777745","display_name":"Nanjing Audit University","ror":"https://ror.org/04zj2bd87","country_code":"CN","type":"education","lineage":["https://openalex.org/I206777745"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yifei Chen","raw_affiliation_strings":["School of Information Science, Nanjing Audit University, Nanjing, P. R. China","School of Information Science, Nanjing Audit University, 86 Yushan Rd(W), Nanjing, P.R. China"],"affiliations":[{"raw_affiliation_string":"School of Information Science, Nanjing Audit University, Nanjing, P. R. China","institution_ids":["https://openalex.org/I206777745"]},{"raw_affiliation_string":"School of Information Science, Nanjing Audit University, 86 Yushan Rd(W), Nanjing, P.R. China","institution_ids":["https://openalex.org/I206777745"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102500842","display_name":"Bingqing Han","orcid":null},"institutions":[{"id":"https://openalex.org/I206777745","display_name":"Nanjing Audit University","ror":"https://ror.org/04zj2bd87","country_code":"CN","type":"education","lineage":["https://openalex.org/I206777745"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bingqing Han","raw_affiliation_strings":["School of Information Science, Nanjing Audit University, Nanjing, P. R. China","School of Information Science, Nanjing Audit University, 86 Yushan Rd(W), Nanjing, P.R. China"],"affiliations":[{"raw_affiliation_string":"School of Information Science, Nanjing Audit University, Nanjing, P. R. China","institution_ids":["https://openalex.org/I206777745"]},{"raw_affiliation_string":"School of Information Science, Nanjing Audit University, 86 Yushan Rd(W), Nanjing, P.R. China","institution_ids":["https://openalex.org/I206777745"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072638565","display_name":"Ping Hou","orcid":"https://orcid.org/0000-0003-1001-3107"},"institutions":[{"id":"https://openalex.org/I2277624104","display_name":"Fondazione Bruno Kessler","ror":"https://ror.org/01j33xk10","country_code":"IT","type":"facility","lineage":["https://openalex.org/I2277624104"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Ping Hou","raw_affiliation_strings":["Fondazione Bruno Kessler (FBK-irst), Trento, Italy","Fondazione Bruno Kessler, FBK-irst, Trento, Italy#TAB#"],"affiliations":[{"raw_affiliation_string":"Fondazione Bruno Kessler (FBK-irst), Trento, Italy","institution_ids":["https://openalex.org/I2277624104"]},{"raw_affiliation_string":"Fondazione Bruno Kessler, FBK-irst, Trento, Italy#TAB#","institution_ids":["https://openalex.org/I2277624104"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100606731"],"corresponding_institution_ids":["https://openalex.org/I206777745"],"apc_list":null,"apc_paid":null,"fwci":0.409,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.72863082,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"598","last_page":"604"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9855999946594238,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9836999773979187,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.728837251663208},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6800087094306946},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6000375151634216},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5915517807006836},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5806263089179993},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5274061560630798},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5042604207992554},{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.48759427666664124},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.46376940608024597},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.37304437160491943},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.354606568813324}],"concepts":[{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.728837251663208},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6800087094306946},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6000375151634216},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5915517807006836},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5806263089179993},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5274061560630798},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5042604207992554},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.48759427666664124},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.46376940608024597},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.37304437160491943},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.354606568813324},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/fskd.2014.6980902","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fskd.2014.6980902","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 11th International Conference on Fuzzy Systems and Knowledge Discovery (FSKD)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.6299999952316284}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W41404523","https://openalex.org/W327991062","https://openalex.org/W1537207111","https://openalex.org/W1585793187","https://openalex.org/W1592683066","https://openalex.org/W1982589161","https://openalex.org/W1999635750","https://openalex.org/W2027147487","https://openalex.org/W2032793012","https://openalex.org/W2034190452","https://openalex.org/W2040884411","https://openalex.org/W2045358009","https://openalex.org/W2053699633","https://openalex.org/W2084439920","https://openalex.org/W2089870669","https://openalex.org/W2103333826","https://openalex.org/W2112543617","https://openalex.org/W2118020653","https://openalex.org/W2119387367","https://openalex.org/W2128600649","https://openalex.org/W2147276454","https://openalex.org/W2148603752","https://openalex.org/W2153635508","https://openalex.org/W2162223169","https://openalex.org/W2166183437","https://openalex.org/W2169611088","https://openalex.org/W3120421331","https://openalex.org/W3120740533","https://openalex.org/W4254721730","https://openalex.org/W6601696544","https://openalex.org/W6631973990","https://openalex.org/W6675969814"],"related_works":["https://openalex.org/W2165912799","https://openalex.org/W2735662278","https://openalex.org/W2382615723","https://openalex.org/W4311804456","https://openalex.org/W151699219","https://openalex.org/W2047139419","https://openalex.org/W2085633464","https://openalex.org/W1966122760","https://openalex.org/W4386564352","https://openalex.org/W2952668426"],"abstract_inverted_index":{"High":[0],"dimensionality":[1,26],"of":[2,8,27,66,97,103,187],"the":[3,9,25,32,36,58,64,95,101,107,110,161,170,174,180,188,202,207],"feature":[4,18,42,47,72,128,211],"space":[5],"is":[6,20],"one":[7],"most":[10],"important":[11],"concerns":[12],"in":[13,185],"text":[14],"categorization":[15],"problems,":[16],"and":[17,49,86,145,158,190,197],"selection":[19,43,73,129,212],"widely":[21],"used":[22],"for":[23,216],"reducing":[24],"features":[28,98,115],"to":[29,56,116],"speed":[30],"up":[31],"computation":[33],"without":[34],"damaging":[35],"performance.":[37],"However,":[38],"a":[39],"lot":[40],"traditional":[41],"methods":[44,178,184,213],"treat":[45],"each":[46],"separately,":[48],"they":[50],"are":[51,152,214],"context":[52,118,125,175,208],"independent.":[53],"In":[54],"order":[55],"address":[57],"problem,":[59],"this":[60],"paper":[61],"first":[62],"presents":[63],"study":[65],"four":[67,123,162],"well":[68],"known":[69],"frequency":[70,112,164,182],"based":[71,127,165,177,183,210],"methods,":[74,130],"including":[75],"Gini":[76],"Index":[77],"(GI),":[78],"Document":[79],"Frequency":[80],"(DF),":[81],"Class":[82],"Discriminating":[83],"Measure":[84],"(CDM)":[85],"Accuracy":[87],"Balanced":[88],"(Acc2).":[89],"Then":[90],"we":[91,121],"focus":[92],"on":[93,154,195],"calculating":[94],"importance":[96],"through":[99],"measuring":[100],"similarity":[102,126,176,209],"their":[104],"contexts":[105],"among":[106],"documents":[108],"but":[109],"document":[111],"containing":[113],"these":[114],"incorporate":[117],"information.":[119],"Hence":[120],"propose":[122],"new":[124],"GI":[131],"<sub":[132,137,142,147],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[133,138,143,148],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">cs</sub>":[134,139,144,149],",":[135,140],"DF":[136],"CDM":[141],"Acc2":[146],".":[150],"They":[151],"evaluated":[153],"different":[155],"data":[156],"sets":[157],"compared":[159],"against":[160],"corresponding":[163,181],"methods.":[166],"Through":[167],"experimental":[168],"analysis,":[169],"results":[171],"reveal":[172],"that":[173],"outperform":[179],"terms":[186],"micro":[189],"macro":[191],"F1":[192],"measures":[193],"both":[194],"binary":[196],"multi-classification":[198],"problems.":[199],"Benefit":[200],"from":[201],"multi-words":[203],"information":[204],"surrounding":[205],"features,":[206],"effective":[215],"article":[217],"categorization.":[218]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
