{"id":"https://openalex.org/W4407835337","doi":"https://doi.org/10.3233/978-1-60750-949-3-381","title":"Using Symbolic Knowledge in the UMLS to Disambiguate Words in Small Datasets with a Na&amp;iuml;ve Bayes Classifier.","display_name":"Using Symbolic Knowledge in the UMLS to Disambiguate Words in Small Datasets with a Na&amp;iuml;ve Bayes Classifier.","publication_year":2004,"publication_date":"2004-01-01","ids":{"openalex":"https://openalex.org/W4407835337","doi":"https://doi.org/10.3233/978-1-60750-949-3-381"},"language":"en","primary_location":{"id":"doi:10.3233/978-1-60750-949-3-381","is_oa":true,"landing_page_url":"https://doi.org/10.3233/978-1-60750-949-3-381","pdf_url":null,"source":{"id":"https://openalex.org/S4210179765","display_name":"Studies in health technology and informatics","issn_l":"0926-9630","issn":["0926-9630","1879-8365"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"book series"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Studies in Health Technology and Informatics","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.3233/978-1-60750-949-3-381","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5116375635","display_name":"Leroy Gondy","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Leroy Gondy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5110425952","display_name":"Ravindranath R. C","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rindflesch Thomas C.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5116375635"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.3829588,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9787999987602234,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.972599983215332,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/unified-medical-language-system","display_name":"Unified Medical Language System","score":0.7835465669631958},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6974232196807861},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6267260313034058},{"id":"https://openalex.org/keywords/naive-bayes-classifier","display_name":"Naive Bayes classifier","score":0.6226229071617126},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.6010850667953491},{"id":"https://openalex.org/keywords/bayes-theorem","display_name":"Bayes' theorem","score":0.5850900411605835},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5660171508789062},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.14802372455596924}],"concepts":[{"id":"https://openalex.org/C69505689","wikidata":"https://www.wikidata.org/wiki/Q455338","display_name":"Unified Medical Language System","level":2,"score":0.7835465669631958},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6974232196807861},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6267260313034058},{"id":"https://openalex.org/C52001869","wikidata":"https://www.wikidata.org/wiki/Q812530","display_name":"Naive Bayes classifier","level":3,"score":0.6226229071617126},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.6010850667953491},{"id":"https://openalex.org/C207201462","wikidata":"https://www.wikidata.org/wiki/Q182505","display_name":"Bayes' theorem","level":3,"score":0.5850900411605835},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5660171508789062},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.14802372455596924},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/978-1-60750-949-3-381","is_oa":true,"landing_page_url":"https://doi.org/10.3233/978-1-60750-949-3-381","pdf_url":null,"source":{"id":"https://openalex.org/S4210179765","display_name":"Studies in health technology and informatics","issn_l":"0926-9630","issn":["0926-9630","1879-8365"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"book series"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Studies in Health Technology and Informatics","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.3233/978-1-60750-949-3-381","is_oa":true,"landing_page_url":"https://doi.org/10.3233/978-1-60750-949-3-381","pdf_url":null,"source":{"id":"https://openalex.org/S4210179765","display_name":"Studies in health technology and informatics","issn_l":"0926-9630","issn":["0926-9630","1879-8365"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"book series"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Studies in Health Technology and Informatics","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W79619734","https://openalex.org/W2010487328","https://openalex.org/W2340589664","https://openalex.org/W4281750475","https://openalex.org/W3087321790","https://openalex.org/W186091728","https://openalex.org/W2939811865","https://openalex.org/W1822792362","https://openalex.org/W2417174640","https://openalex.org/W1507779355"],"abstract_inverted_index":{"Current":[0],"approaches":[1],"to":[2,14,44,55,148,172],"word":[3,19,91],"sense":[4,88],"disambiguation":[5,162],"use":[6,40],"and":[7,20,23,61],"combine":[8],"various":[9],"machine-learning":[10,46],"techniques.":[11],"Most":[12],"refer":[13],"characteristics":[15],"of":[16,28,41,89,98,126],"the":[17,39,59,68,94,123,127,130,140,160,169,173],"ambiguous":[18],"surrounding":[21],"words":[22,79,128,166],"are":[24],"based":[25,114],"on":[26,115,135],"hundreds":[27],"examples.":[29],"Unfortunately,":[30],"developing":[31],"large":[32],"training":[33],"sets":[34],"is":[35],"time-consuming.":[36],"We":[37],"investigate":[38],"symbolic":[42,101],"knowledge":[43,69,102],"augment":[45],"techniques":[47],"for":[48,77,83,165],"small":[49],"datasets.":[50],"UMLS":[51],"semantic":[52,65,124],"types":[53,66,125],"assigned":[54],"concepts":[56],"found":[57,164],"in":[58,105,129],"sentence":[60],"relationships":[62],"between":[63],"these":[64],"form":[67],"base.":[70],"A":[71],"na&amp;iuml;ve":[72],"Bayes":[73],"classifier":[74],"was":[75,103,110,133,163],"trained":[76],"15":[78],"with":[80],"100":[81],"examples":[82],"each.":[84],"The":[85,96,118],"most":[86],"frequent":[87],"a":[90,152,157],"served":[92],"as":[93],"baseline.":[95],"effect":[97],"increasingly":[99],"accurate":[100],"evaluated":[104],"eight":[106],"experimental":[107],"conditions.":[108],"Performance":[109],"measured":[111],"by":[112],"accuracy":[113],"10-fold":[116],"cross-validation.":[117],"best":[119,161],"condition":[120],"used":[121],"only":[122],"sentence.":[131],"Accuracy":[132],"then":[134],"average":[136],"10%":[137],"higher":[138],"than":[139],"baseline;":[141],"however,":[142],"it":[143],"varied":[144],"from":[145],"8%":[146],"deterioration":[147],"29%":[149],"improvement.":[150],"In":[151],"follow-up":[153],"evaluation,":[154],"we":[155],"noted":[156],"trend":[158],"that":[159,167],"were":[168],"least":[170],"troublesome":[171],"human":[174],"evaluators.":[175]},"counts_by_year":[],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
