{"id":"https://openalex.org/W2131887446","doi":"https://doi.org/10.1186/1471-2105-10-403","title":"Investigating heterogeneous protein annotations toward cross-corpora utilization","display_name":"Investigating heterogeneous protein annotations toward cross-corpora utilization","publication_year":2009,"publication_date":"2009-12-01","ids":{"openalex":"https://openalex.org/W2131887446","doi":"https://doi.org/10.1186/1471-2105-10-403","mag":"2131887446","pmid":"https://pubmed.ncbi.nlm.nih.gov/19995463"},"language":"en","primary_location":{"id":"doi:10.1186/1471-2105-10-403","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-10-403","pdf_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/1471-2105-10-403","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/1471-2105-10-403","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100371984","display_name":"Yue Wang","orcid":"https://orcid.org/0000-0002-0278-2347"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]},{"id":"https://openalex.org/I161296585","display_name":"Tokyo University of Science","ror":"https://ror.org/05sj3n476","country_code":"JP","type":"education","lineage":["https://openalex.org/I161296585"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yue Wang","raw_affiliation_strings":["Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan. wangyue@is.s.u-tokyo.ac.jp","Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan. wangyue@is.s.u-tokyo.ac.jp","institution_ids":["https://openalex.org/I161296585"]},{"raw_affiliation_string":"Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063923711","display_name":"Jin-Dong Kim","orcid":"https://orcid.org/0000-0001-9660-6303"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Jin-Dong Kim","raw_affiliation_strings":["Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044967495","display_name":"Rune S\u00e6tre","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Rune S\u00e6tre","raw_affiliation_strings":["Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066925770","display_name":"Sampo Pyysalo","orcid":"https://orcid.org/0000-0002-6279-5000"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Sampo Pyysalo","raw_affiliation_strings":["Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112241147","display_name":"Jun\u2019ichi Tsujii","orcid":null},"institutions":[{"id":"https://openalex.org/I28407311","display_name":"University of Manchester","ror":"https://ror.org/027m9bs27","country_code":"GB","type":"education","lineage":["https://openalex.org/I28407311"]},{"id":"https://openalex.org/I4210112368","display_name":"National Centre for Atmospheric Science","ror":"https://ror.org/01wwwe276","country_code":"GB","type":"nonprofit","lineage":["https://openalex.org/I141816643","https://openalex.org/I4210087105","https://openalex.org/I4210112368"]},{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["GB","JP"],"is_corresponding":false,"raw_author_name":"Jun'ichi Tsujii","raw_affiliation_strings":["Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan","National Center for Text Mining, University of Manchester, Manchester, UK","School of Computer Science, University of Manchester, Manchester, UK"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, School of Information Science and Technology, University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"National Center for Text Mining, University of Manchester, Manchester, UK","institution_ids":["https://openalex.org/I4210112368"]},{"raw_affiliation_string":"School of Computer Science, University of Manchester, Manchester, UK","institution_ids":["https://openalex.org/I28407311"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100371984"],"corresponding_institution_ids":["https://openalex.org/I161296585","https://openalex.org/I74801974"],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072},"fwci":1.4782,"has_fulltext":true,"cited_by_count":24,"citation_normalized_percentile":{"value":0.81731935,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"10","issue":"1","first_page":"403","last_page":"403"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9908000230789185,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8732448816299438},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.8126736879348755},{"id":"https://openalex.org/keywords/named-entity-recognition","display_name":"Named-entity recognition","score":0.6564191579818726},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.645523726940155},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5787123441696167},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.48362934589385986},{"id":"https://openalex.org/keywords/named-entity","display_name":"Named entity","score":0.46624961495399475},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4385386109352112},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.43229764699935913}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8732448816299438},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.8126736879348755},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.6564191579818726},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.645523726940155},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5787123441696167},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.48362934589385986},{"id":"https://openalex.org/C2777889803","wikidata":"https://www.wikidata.org/wiki/Q25047676","display_name":"Named entity","level":2,"score":0.46624961495399475},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4385386109352112},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.43229764699935913},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[{"descriptor_ui":"D005796","descriptor_name":"Genes","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D005796","descriptor_name":"Genes","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D005796","descriptor_name":"Genes","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D005796","descriptor_name":"Genes","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false}],"locations_count":4,"locations":[{"id":"doi:10.1186/1471-2105-10-403","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-10-403","pdf_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/1471-2105-10-403","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},{"id":"pmid:19995463","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/19995463","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC bioinformatics","raw_type":null},{"id":"pmh:oai:doaj.org/article:efb4664072a842d9bdfbd1bfc61ff9da","is_oa":true,"landing_page_url":"https://doaj.org/article/efb4664072a842d9bdfbd1bfc61ff9da","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics, Vol 10, Iss 1, p 403 (2009)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:2804683","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/2804683","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/1471-2105-10-403","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-10-403","pdf_url":"https://bmcbioinformatics.biomedcentral.com/track/pdf/10.1186/1471-2105-10-403","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6399999856948853}],"awards":[{"id":"https://openalex.org/G6267471473","display_name":null,"funder_award_id":"Grant-in-Aid","funder_id":"https://openalex.org/F4320320912","funder_display_name":"Ministry of Education, Culture, Sports, Science and Technology"},{"id":"https://openalex.org/G7599130655","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320320912","funder_display_name":"Ministry of Education, Culture, Sports, Science and Technology"},{"id":"https://openalex.org/G8044579487","display_name":null,"funder_award_id":"Japan","funder_id":"https://openalex.org/F4320320912","funder_display_name":"Ministry of Education, Culture, Sports, Science and Technology"}],"funders":[{"id":"https://openalex.org/F4320320912","display_name":"Ministry of Education, Culture, Sports, Science and Technology","ror":"https://ror.org/048rj2z13"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2131887446.pdf","grobid_xml":"https://content.openalex.org/works/W2131887446.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W1482328859","https://openalex.org/W1487177365","https://openalex.org/W1747861911","https://openalex.org/W1823542770","https://openalex.org/W1932968309","https://openalex.org/W1968848598","https://openalex.org/W1981276685","https://openalex.org/W1995945562","https://openalex.org/W2047782770","https://openalex.org/W2048140075","https://openalex.org/W2057399676","https://openalex.org/W2058412233","https://openalex.org/W2058856481","https://openalex.org/W2061327015","https://openalex.org/W2070786957","https://openalex.org/W2091803989","https://openalex.org/W2102419107","https://openalex.org/W2112670696","https://openalex.org/W2120253533","https://openalex.org/W2120354757","https://openalex.org/W2121844933","https://openalex.org/W2126276057","https://openalex.org/W2134769633","https://openalex.org/W2151698208","https://openalex.org/W2156515921","https://openalex.org/W2157762168","https://openalex.org/W2163107094","https://openalex.org/W2163362093","https://openalex.org/W2166474856","https://openalex.org/W2168905447","https://openalex.org/W2607354300","https://openalex.org/W2793828080","https://openalex.org/W2989631226","https://openalex.org/W2990138404","https://openalex.org/W3082731548","https://openalex.org/W3106889297","https://openalex.org/W4230980737"],"related_works":["https://openalex.org/W2032007337","https://openalex.org/W4377865234","https://openalex.org/W2186562580","https://openalex.org/W2078793151","https://openalex.org/W2155874911","https://openalex.org/W1884363728","https://openalex.org/W4390279576","https://openalex.org/W3128216712","https://openalex.org/W3005759282","https://openalex.org/W3017222382"],"abstract_inverted_index":{"Our":[0],"analysis":[1],"covers":[2],"the":[3,11,23,26,39,48],"key":[4],"similarities":[5],"and":[6],"dissimilarities":[7],"that":[8,44],"exist":[9],"among":[10],"diverse":[12],"gene/protein":[13],"corpora.":[14,49],"This":[15],"paper":[16],"serves":[17],"to":[18,34],"improve":[19],"our":[20],"understanding":[21,37],"of":[22,38,41],"differences":[24],"in":[25],"three":[27],"studied":[28],"corpora,":[29],"which":[30],"can":[31],"then":[32],"lead":[33],"a":[35],"better":[36],"performance":[40],"protein":[42],"recognizers":[43],"are":[45],"based":[46],"on":[47]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":7},{"year":2012,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
