{"id":"https://openalex.org/W2151629867","doi":"https://doi.org/10.1109/tai.2003.1250241","title":"Classification of Web documents using a naive Bayes method","display_name":"Classification of Web documents using a naive Bayes method","publication_year":2004,"publication_date":"2004-03-01","ids":{"openalex":"https://openalex.org/W2151629867","doi":"https://doi.org/10.1109/tai.2003.1250241","mag":"2151629867"},"language":"en","primary_location":{"id":"doi:10.1109/tai.2003.1250241","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2003.1250241","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings. 15th IEEE International Conference on Tools with Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100424366","display_name":"Yong Wang","orcid":"https://orcid.org/0000-0001-7670-3958"},"institutions":[{"id":"https://openalex.org/I99041443","display_name":"Mississippi State University","ror":"https://ror.org/0432jq872","country_code":"US","type":"education","lineage":["https://openalex.org/I4210141039","https://openalex.org/I99041443"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yong Wang","raw_affiliation_strings":["Department of Computer Science & Engineering, Mississippi State University, MS, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science & Engineering, Mississippi State University, MS, USA","institution_ids":["https://openalex.org/I99041443"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110266967","display_name":"Julia Hodges","orcid":null},"institutions":[{"id":"https://openalex.org/I99041443","display_name":"Mississippi State University","ror":"https://ror.org/0432jq872","country_code":"US","type":"education","lineage":["https://openalex.org/I4210141039","https://openalex.org/I99041443"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"J. Hodges","raw_affiliation_strings":["Department of Computer Science & Engineering, Mississippi State University, MS, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science & Engineering, Mississippi State University, MS, USA","institution_ids":["https://openalex.org/I99041443"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074257864","display_name":"Bo Tang","orcid":"https://orcid.org/0000-0001-5708-766X"},"institutions":[{"id":"https://openalex.org/I99041443","display_name":"Mississippi State University","ror":"https://ror.org/0432jq872","country_code":"US","type":"education","lineage":["https://openalex.org/I4210141039","https://openalex.org/I99041443"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bo Tang","raw_affiliation_strings":["Department of Computer Science & Engineering, Mississippi State University, MS, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science & Engineering, Mississippi State University, MS, USA","institution_ids":["https://openalex.org/I99041443"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100424366"],"corresponding_institution_ids":["https://openalex.org/I99041443"],"apc_list":null,"apc_paid":null,"fwci":4.9468,"has_fulltext":false,"cited_by_count":56,"citation_normalized_percentile":{"value":0.9521716,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"560","last_page":"564"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9761999845504761,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8158451318740845},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.756280243396759},{"id":"https://openalex.org/keywords/document-classification","display_name":"Document classification","score":0.5759395360946655},{"id":"https://openalex.org/keywords/bayes-theorem","display_name":"Bayes' theorem","score":0.5255728363990784},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.5239995718002319},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5038849711418152},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.49374040961265564},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4722948372364044},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4582805037498474},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.4581450819969177},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.451917439699173},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.4220602512359619},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.4216897487640381},{"id":"https://openalex.org/keywords/smoothing","display_name":"Smoothing","score":0.4202631115913391},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.41828519105911255},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.13032624125480652},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09461706876754761},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.09030163288116455}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8158451318740845},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.756280243396759},{"id":"https://openalex.org/C2780479914","wikidata":"https://www.wikidata.org/wiki/Q302088","display_name":"Document classification","level":2,"score":0.5759395360946655},{"id":"https://openalex.org/C207201462","wikidata":"https://www.wikidata.org/wiki/Q182505","display_name":"Bayes' theorem","level":3,"score":0.5255728363990784},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.5239995718002319},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5038849711418152},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.49374040961265564},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4722948372364044},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4582805037498474},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.4581450819969177},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.451917439699173},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.4220602512359619},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.4216897487640381},{"id":"https://openalex.org/C3770464","wikidata":"https://www.wikidata.org/wiki/Q775963","display_name":"Smoothing","level":2,"score":0.4202631115913391},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.41828519105911255},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.13032624125480652},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09461706876754761},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.09030163288116455},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tai.2003.1250241","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2003.1250241","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings. 15th IEEE International Conference on Tools with Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W208128215","https://openalex.org/W1512730339","https://openalex.org/W1550206324","https://openalex.org/W1591095982","https://openalex.org/W1677069012","https://openalex.org/W1849729440","https://openalex.org/W1965717632","https://openalex.org/W1978394996","https://openalex.org/W2063918473","https://openalex.org/W2087609354","https://openalex.org/W2091271661","https://openalex.org/W2104805531","https://openalex.org/W2114535528","https://openalex.org/W2134214966","https://openalex.org/W2138667301","https://openalex.org/W2140190241","https://openalex.org/W2145905815","https://openalex.org/W2149684865","https://openalex.org/W2161457724","https://openalex.org/W2435251607","https://openalex.org/W4251909837","https://openalex.org/W6638875480","https://openalex.org/W6679878807","https://openalex.org/W6681847765","https://openalex.org/W6682304300","https://openalex.org/W6717827561"],"related_works":["https://openalex.org/W2537862391","https://openalex.org/W2417174640","https://openalex.org/W4386023432","https://openalex.org/W4317422759","https://openalex.org/W2968744947","https://openalex.org/W4385770464","https://openalex.org/W4300816751","https://openalex.org/W4224262160","https://openalex.org/W2126538150","https://openalex.org/W2324052717"],"abstract_inverted_index":{"This":[0,58],"paper":[1,59],"presents":[2],"an":[3],"automatic":[4],"document":[5],"classification":[6,19,45],"system,":[7],"WebDoc,":[8],"which":[9],"classifies":[10,32],"Web":[11,110],"documents":[12,34,111],"according":[13],"to":[14],"the":[15,27,33,39,44,71,89,105],"Library":[16],"of":[17,43,64,91,96],"Congress":[18],"scheme.":[20],"WebDoc":[21,49,106],"constructs":[22],"a":[23],"knowledge":[24,40],"base":[25],"from":[26,55],"training":[28],"data":[29],"and":[30,79,99,113],"then":[31],"based":[35,51],"on":[36,52],"information":[37],"in":[38,48,94],"base.":[41],"One":[42],"algorithms":[46],"used":[47],"is":[50],"Bayes'":[53],"theorem":[54],"probability":[56,76],"theory.":[57],"focuses":[60],"upon":[61],"three":[62],"aspects":[63],"this":[65,85],"approach:":[66],"different":[67,75,80],"event":[68],"models":[69],"for":[70],"naive":[72],"Bayes":[73],"method,":[74],"smoothing":[77],"methods,":[78],"feature":[81],"selection":[82],"methods.":[83],"In":[84],"paper,":[86],"we":[87],"report":[88],"performance":[90],"each":[92],"method":[93],"terms":[95],"recall,":[97],"precision,":[98],"F-measures.":[100],"Experimental":[101],"results":[102],"show":[103],"that":[104],"system":[107],"can":[108],"classify":[109],"effectively":[112],"efficiently.":[114]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":1},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
