{"id":"https://openalex.org/W32754319","doi":"https://doi.org/10.3233/978-1-60750-939-4-421","title":"A Probabilistic Information Retrieval Approach to Medical Annotation in SWISS-PROT","display_name":"A Probabilistic Information Retrieval Approach to Medical Annotation in SWISS-PROT","publication_year":2003,"publication_date":"2003-01-01","ids":{"openalex":"https://openalex.org/W32754319","doi":"https://doi.org/10.3233/978-1-60750-939-4-421","mag":"32754319","pmid":"https://pubmed.ncbi.nlm.nih.gov/14664023"},"language":"en","primary_location":{"id":"doi:10.3233/978-1-60750-939-4-421","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-60750-939-4-421","pdf_url":null,"source":{"id":"https://openalex.org/S4210179765","display_name":"Studies in health technology and informatics","issn_l":"0926-9630","issn":["0926-9630","1879-8365"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Studies in Health Technology and Informatics","raw_type":"book-chapter"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053076556","display_name":"Pavel B. Dobrokhotov","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dobrokhotov Pavel B.","raw_affiliation_strings":["Pavel.Dobrokhotov@isb-sib.ch"],"affiliations":[{"raw_affiliation_string":"Pavel.Dobrokhotov@isb-sib.ch","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065257553","display_name":"Cyril Goutte","orcid":"https://orcid.org/0000-0003-4939-6555"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goutte Cyril","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108470417","display_name":"Anne\u2010Lise Veuthey","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Veuthey Anne-Lise","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5014352159","display_name":"\u00c9ric Gaussier","orcid":"https://orcid.org/0000-0002-8858-3233"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gaussier Eric","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5053076556"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.7929,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.9090818,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"95","issue":null,"first_page":"421","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.7087249159812927},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7028400897979736},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.6783983111381531},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5169593691825867},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3336804509162903},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.33259424567222595},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.09609928727149963}],"concepts":[{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.7087249159812927},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7028400897979736},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.6783983111381531},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5169593691825867},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3336804509162903},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.33259424567222595},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.09609928727149963}],"mesh":[{"descriptor_ui":"D011336","descriptor_name":"Probability","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D011336","descriptor_name":"Probability","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D011336","descriptor_name":"Probability","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D013557","descriptor_name":"Switzerland","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013557","descriptor_name":"Switzerland","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013557","descriptor_name":"Switzerland","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016247","descriptor_name":"Information Storage and Retrieval","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D016247","descriptor_name":"Information Storage and Retrieval","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D016247","descriptor_name":"Information Storage and Retrieval","qualifier_ui":"Q000706","qualifier_name":"statistics & numerical data","is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.3233/978-1-60750-939-4-421","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-60750-939-4-421","pdf_url":null,"source":{"id":"https://openalex.org/S4210179765","display_name":"Studies in health technology and informatics","issn_l":"0926-9630","issn":["0926-9630","1879-8365"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Studies in Health Technology and Informatics","raw_type":"book-chapter"},{"id":"pmid:14664023","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/14664023","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Studies in health technology and informatics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8700000047683716,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W591063317","https://openalex.org/W1494021613","https://openalex.org/W1531461961","https://openalex.org/W1540550673","https://openalex.org/W1566012138","https://openalex.org/W1612003148","https://openalex.org/W1978304080","https://openalex.org/W2003144438","https://openalex.org/W2049633694","https://openalex.org/W2104768328","https://openalex.org/W2112081648","https://openalex.org/W2148853951","https://openalex.org/W3011379308"],"related_works":["https://openalex.org/W2361861616","https://openalex.org/W2263699433","https://openalex.org/W2377979023","https://openalex.org/W2218034408","https://openalex.org/W2392921965","https://openalex.org/W2358755282","https://openalex.org/W2625833328","https://openalex.org/W4405124681","https://openalex.org/W1533177136","https://openalex.org/W4380994516"],"abstract_inverted_index":{"The":[0],"goal":[1],"of":[2,5,36,93],"medical":[3],"annotation":[4],"human":[6],"proteins":[7],"in":[8],"Swiss-Prot":[9],"is":[10,28],"to":[11,30,55],"add":[12],"features":[13],"specifically":[14],"intended":[15],"for":[16,76],"researchers":[17],"working":[18],"on":[19,65],"genetic":[20],"diseases":[21],"and":[22,51,71],"polymorphisms.":[23],"For":[24],"this":[25,57],"purpose,":[26],"it":[27],"necessary":[29],"search":[31],"through":[32],"a":[33],"vast":[34],"number":[35],"publications":[37],"containing":[38],"relevant":[39,77],"information.":[40],"Promising":[41],"results":[42],"have":[43],"been":[44],"obtained":[45],"by":[46],"applying":[47],"natural":[48],"language":[49],"processing":[50],"machine":[52],"learning":[53],"techniques":[54],"solve":[56],"problem.":[58],"By":[59],"using":[60],"the":[61],"Probabilistic":[62],"Latent":[63],"Categorizer":[64],"representative":[66],"query":[67],"sets,":[68],"69%":[69],"recall":[70],"59%":[72],"precision":[73],"was":[74],"achieved":[75],"documents.":[78],"This":[79],"classifier":[80],"also":[81],"rejected":[82],"irrelevant":[83],"abstracts":[84],"with":[85],"more":[86],"than":[87],"96%":[88],"precision.":[89],"Better":[90],"linguistic":[91],"pre-processing":[92],"source":[94],"documents":[95],"can":[96],"further":[97],"improve":[98],"such":[99],"computer":[100],"approach.":[101]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
