{"id":"https://openalex.org/W2167289895","doi":"https://doi.org/10.1093/bioinformatics/bti084","title":"Automatic extraction of gene/protein biological functions from biomedical text","display_name":"Automatic extraction of gene/protein biological functions from biomedical text","publication_year":2004,"publication_date":"2004-10-27","ids":{"openalex":"https://openalex.org/W2167289895","doi":"https://doi.org/10.1093/bioinformatics/bti084","mag":"2167289895"},"language":"en","primary_location":{"id":"doi:10.1093/bioinformatics/bti084","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/bti084","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/21/7/1227/748704/bti084.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://academic.oup.com/bioinformatics/article-pdf/21/7/1227/748704/bti084.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102170852","display_name":"Asako Koike","orcid":null},"institutions":[{"id":"https://openalex.org/I65143321","display_name":"Hitachi (Japan)","ror":"https://ror.org/02exqgm79","country_code":"JP","type":"company","lineage":["https://openalex.org/I65143321"]},{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Asako Koike","raw_affiliation_strings":["Central Research Laboratory, Hitachi Ltd., 1-280 Higashi-koigakubo, Kokubunji City, Tokyo 185-8601, Japan","Department of Computational Biology, Graduate School of Frontier Science, The University of Tokyo, Kiban-3A1(CB01) 5-1-5, Kashiwanoha Kashiwa, Chiba 277-8561, Japan and"],"affiliations":[{"raw_affiliation_string":"Central Research Laboratory, Hitachi Ltd., 1-280 Higashi-koigakubo, Kokubunji City, Tokyo 185-8601, Japan","institution_ids":["https://openalex.org/I65143321"]},{"raw_affiliation_string":"Department of Computational Biology, Graduate School of Frontier Science, The University of Tokyo, Kiban-3A1(CB01) 5-1-5, Kashiwanoha Kashiwa, Chiba 277-8561, Japan and","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110769241","display_name":"Yoshiki Niwa","orcid":null},"institutions":[{"id":"https://openalex.org/I65143321","display_name":"Hitachi (Japan)","ror":"https://ror.org/02exqgm79","country_code":"JP","type":"company","lineage":["https://openalex.org/I65143321"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yoshiki Niwa","raw_affiliation_strings":["Central Research Laboratory, Hitachi Ltd., 1-280 Higashi-koigakubo, Kokubunji City, Tokyo 185-8601, Japan"],"affiliations":[{"raw_affiliation_string":"Central Research Laboratory, Hitachi Ltd., 1-280 Higashi-koigakubo, Kokubunji City, Tokyo 185-8601, Japan","institution_ids":["https://openalex.org/I65143321"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5104355283","display_name":"Toshihisa Takagi","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Toshihisa Takagi","raw_affiliation_strings":["Department of Computational Biology, Graduate School of Frontier Science, The University of Tokyo, Kiban-3A1(CB01) 5-1-5, Kashiwanoha Kashiwa, Chiba 277-8561, Japan and"],"affiliations":[{"raw_affiliation_string":"Department of Computational Biology, Graduate School of Frontier Science, The University of Tokyo, Kiban-3A1(CB01) 5-1-5, Kashiwanoha Kashiwa, Chiba 277-8561, Japan and","institution_ids":["https://openalex.org/I74801974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102170852"],"corresponding_institution_ids":["https://openalex.org/I65143321","https://openalex.org/I74801974"],"apc_list":{"value":3618,"currency":"USD","value_usd":3618},"apc_paid":null,"fwci":3.3763,"has_fulltext":true,"cited_by_count":80,"citation_normalized_percentile":{"value":0.92935937,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"21","issue":"7","first_page":"1227","last_page":"1236"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9886000156402588,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6559113264083862},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.6162229180335999},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.5355204343795776},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.485067754983902},{"id":"https://openalex.org/keywords/gene-ontology","display_name":"Gene ontology","score":0.47045695781707764},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.45444923639297485},{"id":"https://openalex.org/keywords/gene-family","display_name":"Gene family","score":0.4534755051136017},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4188459515571594},{"id":"https://openalex.org/keywords/protein-family","display_name":"Protein family","score":0.41315871477127075},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35506418347358704},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.3415825068950653},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.33071327209472656},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.22219902276992798},{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.1579599678516388},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.15546196699142456},{"id":"https://openalex.org/keywords/gene-expression","display_name":"Gene expression","score":0.12747907638549805}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6559113264083862},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.6162229180335999},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.5355204343795776},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.485067754983902},{"id":"https://openalex.org/C2987395477","wikidata":"https://www.wikidata.org/wiki/Q135085","display_name":"Gene ontology","level":4,"score":0.47045695781707764},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.45444923639297485},{"id":"https://openalex.org/C5911399","wikidata":"https://www.wikidata.org/wiki/Q2278983","display_name":"Gene family","level":4,"score":0.4534755051136017},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4188459515571594},{"id":"https://openalex.org/C171897839","wikidata":"https://www.wikidata.org/wiki/Q417841","display_name":"Protein family","level":3,"score":0.41315871477127075},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35506418347358704},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.3415825068950653},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.33071327209472656},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.22219902276992798},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.1579599678516388},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.15546196699142456},{"id":"https://openalex.org/C150194340","wikidata":"https://www.wikidata.org/wiki/Q26972","display_name":"Gene expression","level":3,"score":0.12747907638549805}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1093/bioinformatics/bti084","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/bti084","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/21/7/1227/748704/bti084.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.138.707","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.138.707","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://bioinformatics.oxfordjournals.org/cgi/reprint/bti084v1.pdf","raw_type":"text"}],"best_oa_location":{"id":"doi:10.1093/bioinformatics/bti084","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/bti084","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/21/7/1227/748704/bti084.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7599999904632568}],"awards":[{"id":"https://openalex.org/G12401395","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320320912","funder_display_name":"Ministry of Education, Culture, Sports, Science and Technology"},{"id":"https://openalex.org/G8044579487","display_name":null,"funder_award_id":"Japan","funder_id":"https://openalex.org/F4320320912","funder_display_name":"Ministry of Education, Culture, Sports, Science and Technology"}],"funders":[{"id":"https://openalex.org/F4320320912","display_name":"Ministry of Education, Culture, Sports, Science and Technology","ror":"https://ror.org/048rj2z13"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2167289895.pdf","grobid_xml":"https://content.openalex.org/works/W2167289895.grobid-xml"},"referenced_works_count":25,"referenced_works":["https://openalex.org/W1491978778","https://openalex.org/W1526873677","https://openalex.org/W1527263662","https://openalex.org/W1592053870","https://openalex.org/W1980586944","https://openalex.org/W1987213598","https://openalex.org/W1992770405","https://openalex.org/W1999117234","https://openalex.org/W2000569744","https://openalex.org/W2023736097","https://openalex.org/W2099393019","https://openalex.org/W2101595316","https://openalex.org/W2103017472","https://openalex.org/W2103907281","https://openalex.org/W2106093878","https://openalex.org/W2142574443","https://openalex.org/W2144001613","https://openalex.org/W2158505321","https://openalex.org/W2160521949","https://openalex.org/W2161890636","https://openalex.org/W2165612380","https://openalex.org/W2314420468","https://openalex.org/W4234200495","https://openalex.org/W4240541971","https://openalex.org/W6725524006"],"related_works":["https://openalex.org/W2349587167","https://openalex.org/W2797565378","https://openalex.org/W2080517113","https://openalex.org/W3154956619","https://openalex.org/W2889112813","https://openalex.org/W2089457640","https://openalex.org/W2055793566","https://openalex.org/W1980836133","https://openalex.org/W2229695611","https://openalex.org/W2052343958"],"abstract_inverted_index":{"Abstract":[0],"Motivation:":[1],"With":[2],"the":[3,10,16,46,71,94,113,119,127,140,185],"rapid":[4],"advancement":[5],"of":[6,12,18,21,33,42,51,75,105,110,139,169,174],"biomedical":[7,24],"science":[8],"and":[9,88,97,107,155,194],"development":[11],"high-throughput":[13,43],"analysis":[14,91],"methods,":[15],"extraction":[17,50],"various":[19],"types":[20],"information":[22,52],"from":[23,57,82],"text":[25,58,83],"has":[26,59,165],"become":[27],"critical.":[28],"Since":[29],"automatic":[30,49],"functional":[31,146],"annotations":[32],"genes":[34],"are":[35,100,116,124,207],"quite":[36],"useful":[37],"for":[38,48,68,176,199],"interpreting":[39],"large":[40],"amounts":[41],"data":[44],"efficiently,":[45],"demand":[47],"related":[53],"to":[54,118,184],"gene":[55,205],"functions":[56,74,99,179,206],"been":[60],"increasing.":[61],"Results:":[62],"We":[63],"have":[64],"developed":[65,131],"a":[66,85,172],"method":[67,164],"automatically":[69],"extracting":[70],"biological":[72],"process":[73],"genes/protein/families":[76],"based":[77,148],"on":[78,149],"Gene":[79],"Ontology":[80],"(GO)":[81],"using":[84,126,151],"shallow":[86],"parser":[87],"sentence":[89],"structure":[90],"techniques.":[92,157],"When":[93,182],"gene/protein/family":[95,122,128,141],"names":[96,123],"their":[98],"described":[101,178],"in":[102,180],"ACTOR":[103],"(doer":[104],"action)":[106,111],"OBJECT":[108],"(receiver":[109],"relationships,":[112],"corresponding":[114],"GO-IDs":[115],"assigned":[117],"genes/proteins/families.":[120],"The":[121,203],"recognized":[125],"name":[129],"dictionaries":[130],"by":[132],"our":[133,163],"group.":[134],"To":[135],"achieve":[136],"wide":[137],"recognition":[138],"functions,":[142],"we":[143],"semi-automatically":[144],"gather":[145],"terms":[147],"GO":[150],"co-occurrence,":[152],"collocation":[153],"similarities":[154],"rule-based":[156],"A":[158],"preliminary":[159],"experiment":[160],"demonstrated":[161],"that":[162],"an":[166],"estimated":[167],"recall":[168],"54\u201364%":[170],"with":[171],"precision":[173],"91\u201394%":[175],"actually":[177],"abstracts.":[181],"applied":[183],"PUBMED,":[186],"it":[187],"extracted":[188,204],"over":[189],"190":[190],"000":[191,196],"gene\u2013GO":[192],"relationships":[193,198],"150":[195],"family\u2013GO":[197],"major":[200],"eukaryotes.":[201],"Availability:":[202],"available":[208],"at":[209],"http://prime.ontology.ims.u-tokyo.ac.jp":[210],"Contact:":[211],"akoike@hgc.jp":[212]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":5},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
