{"id":"https://openalex.org/W2104544690","doi":"https://doi.org/10.1186/1471-2105-13-16","title":"Automatic categorization of diverse experimental information in the bioscience literature","display_name":"Automatic categorization of diverse experimental information in the bioscience literature","publication_year":2012,"publication_date":"2012-01-26","ids":{"openalex":"https://openalex.org/W2104544690","doi":"https://doi.org/10.1186/1471-2105-13-16","mag":"2104544690","pmid":"https://pubmed.ncbi.nlm.nih.gov/22280404"},"language":"en","primary_location":{"id":"doi:10.1186/1471-2105-13-16","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-13-16","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-13-16","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-13-16","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022121743","display_name":"Ruihua Fang","orcid":"https://orcid.org/0000-0001-5102-7156"},"institutions":[{"id":"https://openalex.org/I122411786","display_name":"California Institute of Technology","ror":"https://ror.org/05dxps055","country_code":"US","type":"education","lineage":["https://openalex.org/I122411786"]},{"id":"https://openalex.org/I1344073410","display_name":"Howard Hughes Medical Institute","ror":"https://ror.org/006w34k90","country_code":"US","type":"facility","lineage":["https://openalex.org/I1344073410"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ruihua Fang","raw_affiliation_strings":["Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA 91125, USA","Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA 91125, USA","institution_ids":["https://openalex.org/I1344073410"]},{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA","institution_ids":["https://openalex.org/I122411786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083706322","display_name":"Gary Schindelman","orcid":null},"institutions":[{"id":"https://openalex.org/I122411786","display_name":"California Institute of Technology","ror":"https://ror.org/05dxps055","country_code":"US","type":"education","lineage":["https://openalex.org/I122411786"]},{"id":"https://openalex.org/I1344073410","display_name":"Howard Hughes Medical Institute","ror":"https://ror.org/006w34k90","country_code":"US","type":"facility","lineage":["https://openalex.org/I1344073410"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gary Schindelman","raw_affiliation_strings":["Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","institution_ids":["https://openalex.org/I122411786","https://openalex.org/I1344073410"]},{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA","institution_ids":["https://openalex.org/I122411786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034108611","display_name":"Kimberly Van Auken","orcid":"https://orcid.org/0000-0002-1706-4196"},"institutions":[{"id":"https://openalex.org/I122411786","display_name":"California Institute of Technology","ror":"https://ror.org/05dxps055","country_code":"US","type":"education","lineage":["https://openalex.org/I122411786"]},{"id":"https://openalex.org/I1344073410","display_name":"Howard Hughes Medical Institute","ror":"https://ror.org/006w34k90","country_code":"US","type":"facility","lineage":["https://openalex.org/I1344073410"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kimberly Van Auken","raw_affiliation_strings":["Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","institution_ids":["https://openalex.org/I122411786","https://openalex.org/I1344073410"]},{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA","institution_ids":["https://openalex.org/I122411786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047836268","display_name":"Jolene S. Fernandes","orcid":null},"institutions":[{"id":"https://openalex.org/I122411786","display_name":"California Institute of Technology","ror":"https://ror.org/05dxps055","country_code":"US","type":"education","lineage":["https://openalex.org/I122411786"]},{"id":"https://openalex.org/I1344073410","display_name":"Howard Hughes Medical Institute","ror":"https://ror.org/006w34k90","country_code":"US","type":"facility","lineage":["https://openalex.org/I1344073410"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jolene Fernandes","raw_affiliation_strings":["Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","institution_ids":["https://openalex.org/I122411786","https://openalex.org/I1344073410"]},{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA","institution_ids":["https://openalex.org/I122411786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100344186","display_name":"Wen Chen","orcid":"https://orcid.org/0000-0003-0853-7526"},"institutions":[{"id":"https://openalex.org/I122411786","display_name":"California Institute of Technology","ror":"https://ror.org/05dxps055","country_code":"US","type":"education","lineage":["https://openalex.org/I122411786"]},{"id":"https://openalex.org/I1344073410","display_name":"Howard Hughes Medical Institute","ror":"https://ror.org/006w34k90","country_code":"US","type":"facility","lineage":["https://openalex.org/I1344073410"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wen Chen","raw_affiliation_strings":["Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","institution_ids":["https://openalex.org/I122411786","https://openalex.org/I1344073410"]},{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA","institution_ids":["https://openalex.org/I122411786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100382645","display_name":"Xiaodong Wang","orcid":"https://orcid.org/0000-0001-9885-356X"},"institutions":[{"id":"https://openalex.org/I122411786","display_name":"California Institute of Technology","ror":"https://ror.org/05dxps055","country_code":"US","type":"education","lineage":["https://openalex.org/I122411786"]},{"id":"https://openalex.org/I1344073410","display_name":"Howard Hughes Medical Institute","ror":"https://ror.org/006w34k90","country_code":"US","type":"facility","lineage":["https://openalex.org/I1344073410"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaodong Wang","raw_affiliation_strings":["Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","institution_ids":["https://openalex.org/I122411786","https://openalex.org/I1344073410"]},{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA","institution_ids":["https://openalex.org/I122411786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028184419","display_name":"Paul A. Davis","orcid":"https://orcid.org/0000-0001-5545-0824"},"institutions":[{"id":"https://openalex.org/I2802476451","display_name":"Wellcome Sanger Institute","ror":"https://ror.org/05cy4wa09","country_code":"GB","type":"nonprofit","lineage":["https://openalex.org/I2802476451","https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Paul Davis","raw_affiliation_strings":["Wellcome Trust Sanger Institute, Wellcome Trust Genome Campus, Cambridge, CB10 1SA, UK","Wellcome Trust Sanger Institute,  Wellcome Trust Genome Campus, Cambridge, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Wellcome Trust Sanger Institute, Wellcome Trust Genome Campus, Cambridge, CB10 1SA, UK","institution_ids":["https://openalex.org/I2802476451"]},{"raw_affiliation_string":"Wellcome Trust Sanger Institute,  Wellcome Trust Genome Campus, Cambridge, UK","institution_ids":["https://openalex.org/I2802476451"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026096278","display_name":"Mary Ann Tuli","orcid":"https://orcid.org/0000-0002-4667-9528"},"institutions":[{"id":"https://openalex.org/I2802476451","display_name":"Wellcome Sanger Institute","ror":"https://ror.org/05cy4wa09","country_code":"GB","type":"nonprofit","lineage":["https://openalex.org/I2802476451","https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Mary Ann Tuli","raw_affiliation_strings":["Wellcome Trust Sanger Institute, Wellcome Trust Genome Campus, Cambridge, CB10 1SA, UK","Wellcome Trust Sanger Institute,  Wellcome Trust Genome Campus, Cambridge, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Wellcome Trust Sanger Institute, Wellcome Trust Genome Campus, Cambridge, CB10 1SA, UK","institution_ids":["https://openalex.org/I2802476451"]},{"raw_affiliation_string":"Wellcome Trust Sanger Institute,  Wellcome Trust Genome Campus, Cambridge, UK","institution_ids":["https://openalex.org/I2802476451"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005252212","display_name":"Steven J Marygold","orcid":"https://orcid.org/0000-0003-2759-266X"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Steven J Marygold","raw_affiliation_strings":["Department of Genetics, University of Cambridge, Downing Street, Cambridge, CB2 3EH, UK","Department of Genetics University of Cambridge, Cambridge, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Genetics, University of Cambridge, Downing Street, Cambridge, CB2 3EH, UK","institution_ids":["https://openalex.org/I241749"]},{"raw_affiliation_string":"Department of Genetics University of Cambridge, Cambridge, UK","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039497090","display_name":"Gillian Millburn","orcid":"https://orcid.org/0000-0002-1139-1145"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Gillian Millburn","raw_affiliation_strings":["Department of Genetics, University of Cambridge, Downing Street, Cambridge, CB2 3EH, UK","Department of Genetics University of Cambridge, Cambridge, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Genetics, University of Cambridge, Downing Street, Cambridge, CB2 3EH, UK","institution_ids":["https://openalex.org/I241749"]},{"raw_affiliation_string":"Department of Genetics University of Cambridge, Cambridge, UK","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022378337","display_name":"Beverley Matthews","orcid":"https://orcid.org/0000-0002-0967-1076"},"institutions":[{"id":"https://openalex.org/I136199984","display_name":"Harvard University","ror":"https://ror.org/03vek6s52","country_code":"US","type":"education","lineage":["https://openalex.org/I136199984"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Beverley Matthews","raw_affiliation_strings":["Department of Molecular and Cellular Biology, Harvard University, Cambridge, MA, 02138, USA","Department of Molecular & Cellular Biology, Harvard University, Cambridge, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Molecular and Cellular Biology, Harvard University, Cambridge, MA, 02138, USA","institution_ids":["https://openalex.org/I136199984"]},{"raw_affiliation_string":"Department of Molecular & Cellular Biology, Harvard University, Cambridge, USA","institution_ids":["https://openalex.org/I136199984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100325488","display_name":"Haiyan Zhang","orcid":"https://orcid.org/0000-0002-2877-2040"},"institutions":[{"id":"https://openalex.org/I136199984","display_name":"Harvard University","ror":"https://ror.org/03vek6s52","country_code":"US","type":"education","lineage":["https://openalex.org/I136199984"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Haiyan Zhang","raw_affiliation_strings":["Department of Molecular and Cellular Biology, Harvard University, Cambridge, MA, 02138, USA","Department of Molecular & Cellular Biology, Harvard University, Cambridge, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Molecular and Cellular Biology, Harvard University, Cambridge, MA, 02138, USA","institution_ids":["https://openalex.org/I136199984"]},{"raw_affiliation_string":"Department of Molecular & Cellular Biology, Harvard University, Cambridge, USA","institution_ids":["https://openalex.org/I136199984"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Nick Brown","orcid":null},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]},{"id":"https://openalex.org/I2801782436","display_name":"The Gurdon Institute","ror":"https://ror.org/00fp3ce15","country_code":"GB","type":"facility","lineage":["https://openalex.org/I241749","https://openalex.org/I2801316944","https://openalex.org/I2801782436","https://openalex.org/I87048295"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Nick Brown","raw_affiliation_strings":["The Gurdon Institute and Department of Physiology, Development & Neuroscience, University of Cambridge, Tennis Court Road, Cambridge, CB2 1QN, UK","The Gurdon Institute and Department of Physiology, Development and Neuroscience, University of Cambridge, Cambridge, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Gurdon Institute and Department of Physiology, Development & Neuroscience, University of Cambridge, Tennis Court Road, Cambridge, CB2 1QN, UK","institution_ids":["https://openalex.org/I2801782436","https://openalex.org/I241749"]},{"raw_affiliation_string":"The Gurdon Institute and Department of Physiology, Development and Neuroscience, University of Cambridge, Cambridge, UK","institution_ids":["https://openalex.org/I2801782436","https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109425503","display_name":"William M Gelbart","orcid":null},"institutions":[{"id":"https://openalex.org/I136199984","display_name":"Harvard University","ror":"https://ror.org/03vek6s52","country_code":"US","type":"education","lineage":["https://openalex.org/I136199984"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"William M Gelbart","raw_affiliation_strings":["Department of Molecular and Cellular Biology, Harvard University, Cambridge, MA, 02138, USA","Department of Molecular & Cellular Biology, Harvard University, Cambridge, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Molecular and Cellular Biology, Harvard University, Cambridge, MA, 02138, USA","institution_ids":["https://openalex.org/I136199984"]},{"raw_affiliation_string":"Department of Molecular & Cellular Biology, Harvard University, Cambridge, USA","institution_ids":["https://openalex.org/I136199984"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033624132","display_name":"Paul W. Sternberg","orcid":"https://orcid.org/0000-0002-7699-0173"},"institutions":[{"id":"https://openalex.org/I122411786","display_name":"California Institute of Technology","ror":"https://ror.org/05dxps055","country_code":"US","type":"education","lineage":["https://openalex.org/I122411786"]},{"id":"https://openalex.org/I1344073410","display_name":"Howard Hughes Medical Institute","ror":"https://ror.org/006w34k90","country_code":"US","type":"facility","lineage":["https://openalex.org/I1344073410"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Paul W Sternberg","raw_affiliation_strings":["Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, CA, 91125, USA","institution_ids":["https://openalex.org/I122411786","https://openalex.org/I1344073410"]},{"raw_affiliation_string":"Howard Hughes Medical Institute and Biology Division, California Institute of Technology, Pasadena, USA","institution_ids":["https://openalex.org/I122411786"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":15,"corresponding_author_ids":["https://openalex.org/A5033624132"],"corresponding_institution_ids":["https://openalex.org/I122411786","https://openalex.org/I1344073410"],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072},"fwci":1.7467,"has_fulltext":true,"cited_by_count":39,"citation_normalized_percentile":{"value":0.84326017,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"13","issue":"1","first_page":"16","last_page":"16"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.8989999890327454,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.8989999890327454,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.023399999365210533,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.014999999664723873,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7464109659194946},{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.6891914010047913},{"id":"https://openalex.org/keywords/data-curation","display_name":"Data curation","score":0.6238945722579956},{"id":"https://openalex.org/keywords/biological-database","display_name":"Biological database","score":0.6166089773178101},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5863112211227417},{"id":"https://openalex.org/keywords/data-type","display_name":"Data type","score":0.5196191668510437},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4813864529132843},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.47486281394958496},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.4126933515071869},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.39457249641418457},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3363063931465149},{"id":"https://openalex.org/keywords/bioinformatics","display_name":"Bioinformatics","score":0.24729230999946594},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.09638795256614685}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7464109659194946},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.6891914010047913},{"id":"https://openalex.org/C91632574","wikidata":"https://www.wikidata.org/wiki/Q15088675","display_name":"Data curation","level":2,"score":0.6238945722579956},{"id":"https://openalex.org/C20901353","wikidata":"https://www.wikidata.org/wiki/Q4117139","display_name":"Biological database","level":2,"score":0.6166089773178101},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5863112211227417},{"id":"https://openalex.org/C138958017","wikidata":"https://www.wikidata.org/wiki/Q190087","display_name":"Data type","level":2,"score":0.5196191668510437},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4813864529132843},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.47486281394958496},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.4126933515071869},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.39457249641418457},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3363063931465149},{"id":"https://openalex.org/C60644358","wikidata":"https://www.wikidata.org/wiki/Q128570","display_name":"Bioinformatics","level":1,"score":0.24729230999946594},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.09638795256614685},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001331","descriptor_name":"Automation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001331","descriptor_name":"Automation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001331","descriptor_name":"Automation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004331","descriptor_name":"Drosophila melanogaster","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D004331","descriptor_name":"Drosophila melanogaster","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D004331","descriptor_name":"Drosophila melanogaster","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011642","descriptor_name":"Publications","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011642","descriptor_name":"Publications","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011642","descriptor_name":"Publications","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017173","descriptor_name":"Caenorhabditis elegans","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D017173","descriptor_name":"Caenorhabditis elegans","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D017173","descriptor_name":"Caenorhabditis elegans","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D023281","descriptor_name":"Genomics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D051379","descriptor_name":"Mice","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D051379","descriptor_name":"Mice","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D051379","descriptor_name":"Mice","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D060388","descriptor_name":"Support Vector Machine","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D060388","descriptor_name":"Support Vector Machine","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D060388","descriptor_name":"Support Vector Machine","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":6,"locations":[{"id":"doi:10.1186/1471-2105-13-16","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-13-16","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-13-16","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},{"id":"pmid:22280404","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/22280404","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC bioinformatics","raw_type":null},{"id":"pmh:oai:authors.library.caltech.edu:29784","is_oa":true,"landing_page_url":"https://authors.library.caltech.edu/29784/","pdf_url":null,"source":{"id":"https://openalex.org/S4306402161","display_name":"CaltechAUTHORS (California Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I122411786","host_organization_name":"California Institute of Technology","host_organization_lineage":["https://openalex.org/I122411786"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"},{"id":"pmh:oai:dash.harvard.edu:1/11248784","is_oa":true,"landing_page_url":"http://nrs.harvard.edu/urn-3:HUL.InstRepos:11248784","pdf_url":null,"source":{"id":"https://openalex.org/S4306401540","display_name":"Digital Access to Scholarship at Harvard (DASH) (Harvard University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I136199984","host_organization_name":"Harvard University","host_organization_lineage":["https://openalex.org/I136199984"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Journal Article"},{"id":"pmh:oai:doaj.org/article:bed8b18ae930465f8ba11241758bd777","is_oa":true,"landing_page_url":"https://doaj.org/article/bed8b18ae930465f8ba11241758bd777","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics, Vol 13, Iss 1, p 16 (2012)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:3305665","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/3305665","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/1471-2105-13-16","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-13-16","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-13-16","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4463229245","display_name":null,"funder_award_id":"HG002223","funder_id":"https://openalex.org/F4320337348","funder_display_name":"National Human Genome Research Institute"}],"funders":[{"id":"https://openalex.org/F4320306082","display_name":"Howard Hughes Medical Institute","ror":"https://ror.org/006w34k90"},{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"},{"id":"https://openalex.org/F4320337348","display_name":"National Human Genome Research Institute","ror":"https://ror.org/00baak391"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2104544690.pdf","grobid_xml":"https://content.openalex.org/works/W2104544690.grobid-xml"},"referenced_works_count":61,"referenced_works":["https://openalex.org/W740415","https://openalex.org/W114870494","https://openalex.org/W119778216","https://openalex.org/W124454490","https://openalex.org/W140600869","https://openalex.org/W149595388","https://openalex.org/W161282504","https://openalex.org/W195873702","https://openalex.org/W202303397","https://openalex.org/W1480287196","https://openalex.org/W1485124666","https://openalex.org/W1492082341","https://openalex.org/W1532325895","https://openalex.org/W1540550673","https://openalex.org/W1576520375","https://openalex.org/W1603229901","https://openalex.org/W1604792744","https://openalex.org/W1604938182","https://openalex.org/W1704134116","https://openalex.org/W1968537328","https://openalex.org/W1994306321","https://openalex.org/W2002857471","https://openalex.org/W2005422315","https://openalex.org/W2053673723","https://openalex.org/W2053724458","https://openalex.org/W2073051186","https://openalex.org/W2091940856","https://openalex.org/W2097052916","https://openalex.org/W2097106271","https://openalex.org/W2103308144","https://openalex.org/W2103333826","https://openalex.org/W2105948726","https://openalex.org/W2107141268","https://openalex.org/W2116796547","https://openalex.org/W2123273303","https://openalex.org/W2123766055","https://openalex.org/W2126276057","https://openalex.org/W2131730455","https://openalex.org/W2138229177","https://openalex.org/W2138505392","https://openalex.org/W2139259976","https://openalex.org/W2141341393","https://openalex.org/W2141921295","https://openalex.org/W2144181601","https://openalex.org/W2146486983","https://openalex.org/W2149684865","https://openalex.org/W2153635508","https://openalex.org/W2154159734","https://openalex.org/W2155529673","https://openalex.org/W2156909104","https://openalex.org/W2170654002","https://openalex.org/W2297432279","https://openalex.org/W2435251607","https://openalex.org/W2475645889","https://openalex.org/W2792952625","https://openalex.org/W3087927280","https://openalex.org/W3120421331","https://openalex.org/W4213009331","https://openalex.org/W4302501099","https://openalex.org/W6679915611","https://openalex.org/W6680954332"],"related_works":["https://openalex.org/W2165912799","https://openalex.org/W2735662278","https://openalex.org/W2762474792","https://openalex.org/W2111303602","https://openalex.org/W2772431536","https://openalex.org/W2951897737","https://openalex.org/W2891678595","https://openalex.org/W2097106271","https://openalex.org/W2124450377","https://openalex.org/W1968095293"],"abstract_inverted_index":{"BACKGROUND:":[0],"Curation":[1],"of":[2,15,70,95,135,157,213,220,234,254,311,349,394],"information":[3,18,69],"from":[4,34,217,281,286,292],"bioscience":[5],"literature":[6,37,221],"into":[7],"biological":[8],"knowledge":[9],"databases":[10,183],"is":[11,31,50,74,112,153,298,364],"a":[12,20,27,44,92,204,239,257,347,359],"crucial":[13],"way":[14],"capturing":[16],"experimental":[17,122,138],"in":[19,52,128,130,140,154,160,184,301],"computable":[21],"form.":[22],"During":[23],"the":[24,38,48,101,141,147,155,161,167,185,275,302,383,391,396],"biocuration":[25,142,162,186,400],"process,":[26],"critical":[28],"first":[29],"step":[30,55],"to":[32,59,64,120,209,229,267,346,358,373,390],"identify":[33,230],"all":[35],"published":[36,96,313],"papers":[39,63,85,98,212,231,266,314],"that":[40,174,382],"contain":[41,68],"results":[42],"for":[43,83,132,146,238,248,308],"specific":[45],"data":[46,89,123,215,236,250,279,284,290,317,350],"type":[47],"curator":[49],"interested":[51],"annotating.":[53],"This":[54,109,242],"normally":[56],"requires":[57],"curators":[58],"manually":[60],"examine":[61],"many":[62],"ascertain":[65],"which":[66],"few":[67,360],"interest":[71],"and":[72,115,151,166,188,198,226,288,337],"thus,":[73],"usually":[75],"time":[76,192],"consuming.":[77],"We":[78,172,201,272,380],"developed":[79,203],"an":[80,195],"automatic":[81,114,133,309,366],"method":[82,104,176,276],"identifying":[84],"containing":[86,355],"these":[87,235],"curation":[88,303],"types":[90,216,237,280,285,291,318,351],"among":[91],"large":[93],"pool":[94],"scientific":[97],"based":[99],"on":[100,194,277],"machine":[102],"learning":[103],"Support":[105],"Vector":[106],"Machine":[107],"(SVM).":[108],"classification":[110],"system":[111],"completely":[113,365],"can":[116,177,369,387],"be":[117,178,370],"readily":[118,179,206,371],"applied":[119],"diverse":[121],"types.":[124],"It":[125,297,363],"has":[126,244],"been":[127],"use":[129],"production":[131],"categorization":[134],"10":[136],"different":[137,218,374,377],"datatypes":[139],"process":[143,156,163],"at":[144,164,306,376],"WormBase":[145,307],"past":[148],"two":[149],"years":[150],"it":[152],"being":[158,299],"adopted":[159,180],"FlyBase":[165,287],"Saccharomyces":[168],"Genome":[169],"Database":[170],"(SGD).":[171],"anticipate":[173],"this":[175],"by":[181],"various":[182],"community":[187],"thereby":[189],"greatly":[190,389],"reducing":[191],"spent":[193],"otherwise":[196],"laborious":[197],"demanding":[199],"task.":[200],"also":[202],"simple,":[205],"automated":[207],"procedure":[208],"utilize":[210],"training":[211,265,353],"similar":[214],"bodies":[219],"such":[222],"as":[223],"C.":[224],"elegans":[225],"D.":[227],"melanogaster":[228],"with":[232,315,352],"any":[233],"single":[240,258],"database.":[241],"approach":[243],"great":[245],"significance":[246],"because":[247],"some":[249],"types,":[251],"especially":[252],"those":[253],"low":[255],"occurrence,":[256],"corpus":[259],"often":[260],"does":[261],"not":[262],"have":[263],"enough":[264],"achieve":[268],"satisfactory":[269],"performance.":[270],"RESULTS:":[271],"successfully":[273],"tested":[274],"ten":[278,316],"WormBase,":[282],"fifteen":[283],"three":[289],"Mouse":[293],"Genomics":[294],"Informatics":[295],"(MGI).":[296],"used":[300],"work":[304,384],"flow":[305],"association":[310],"newly":[312],"including":[319],"RNAi,":[320],"antibody,":[321],"phenotype,":[322,334],"gene":[323,328,330,335,338],"regulation,":[324],"mutant":[325],"allele":[326],"sequence,":[327],"expression,":[329],"product":[331],"interaction,":[332,336],"overexpression":[333],"structure":[339],"correction.":[340],"CONCLUSIONS:":[341],"Our":[342],"methods":[343],"are":[344],"applicable":[345],"variety":[348],"set":[354],"several":[356],"hundreds":[357],"thousand":[361],"documents.":[362],"and,":[367],"thus":[368],"incorporated":[372],"workflow":[375],"literature-based":[378],"databases.":[379],"believe":[381],"presented":[385],"here":[386],"contribute":[388],"tremendous":[392],"task":[393],"automating":[395],"important":[397],"yet":[398],"labor-intensive":[399],"effort.":[401]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":4},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":5}],"updated_date":"2026-06-19T15:47:20.252518","created_date":"2025-10-10T00:00:00"}
