{"id":"https://openalex.org/W1981987714","doi":"https://doi.org/10.1145/2009916.2010080","title":"Tackling class imbalance and data scarcity in literature-based gene function annotation","display_name":"Tackling class imbalance and data scarcity in literature-based gene function annotation","publication_year":2011,"publication_date":"2011-07-24","ids":{"openalex":"https://openalex.org/W1981987714","doi":"https://doi.org/10.1145/2009916.2010080","mag":"1981987714"},"language":"en","primary_location":{"id":"doi:10.1145/2009916.2010080","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2009916.2010080","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th international ACM SIGIR conference on Research and development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049123454","display_name":"Mathieu Blondel","orcid":"https://orcid.org/0000-0002-2366-2993"},"institutions":[{"id":"https://openalex.org/I65837984","display_name":"Kobe University","ror":"https://ror.org/03tgsfw79","country_code":"JP","type":"education","lineage":["https://openalex.org/I65837984"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Mathieu Blondel","raw_affiliation_strings":["Kobe University, Kobe, Japan","[Kobe University, Kobe, JAPAN]"],"affiliations":[{"raw_affiliation_string":"Kobe University, Kobe, Japan","institution_ids":["https://openalex.org/I65837984"]},{"raw_affiliation_string":"[Kobe University, Kobe, JAPAN]","institution_ids":["https://openalex.org/I65837984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103280533","display_name":"Kazuhiro Seki","orcid":"https://orcid.org/0000-0002-1967-4334"},"institutions":[{"id":"https://openalex.org/I65837984","display_name":"Kobe University","ror":"https://ror.org/03tgsfw79","country_code":"JP","type":"education","lineage":["https://openalex.org/I65837984"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kazuhiro Seki","raw_affiliation_strings":["Kobe University, Kobe, Japan","[Kobe University, Kobe, JAPAN]"],"affiliations":[{"raw_affiliation_string":"Kobe University, Kobe, Japan","institution_ids":["https://openalex.org/I65837984"]},{"raw_affiliation_string":"[Kobe University, Kobe, JAPAN]","institution_ids":["https://openalex.org/I65837984"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023847482","display_name":"Kuniaki Uehara","orcid":"https://orcid.org/0000-0002-7160-3752"},"institutions":[{"id":"https://openalex.org/I65837984","display_name":"Kobe University","ror":"https://ror.org/03tgsfw79","country_code":"JP","type":"education","lineage":["https://openalex.org/I65837984"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kuniaki Uehara","raw_affiliation_strings":["Kobe University, Kobe, Japan","[Kobe University, Kobe, JAPAN]"],"affiliations":[{"raw_affiliation_string":"Kobe University, Kobe, Japan","institution_ids":["https://openalex.org/I65837984"]},{"raw_affiliation_string":"[Kobe University, Kobe, JAPAN]","institution_ids":["https://openalex.org/I65837984"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5049123454"],"corresponding_institution_ids":["https://openalex.org/I65837984"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.0617385,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1123","last_page":"1124"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10887","display_name":"Bioinformatics and Genomic Networks","score":0.9840999841690063,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.8190237283706665},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.684432327747345},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.6127630472183228},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6094229221343994},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5959275364875793},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5778862237930298},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5549983382225037},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.5033463835716248},{"id":"https://openalex.org/keywords/scarcity","display_name":"Scarcity","score":0.4706149697303772},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.4453766644001007},{"id":"https://openalex.org/keywords/string-kernel","display_name":"String kernel","score":0.439485639333725},{"id":"https://openalex.org/keywords/kernel-method","display_name":"Kernel method","score":0.345417857170105},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.24312791228294373},{"id":"https://openalex.org/keywords/radial-basis-function-kernel","display_name":"Radial basis function kernel","score":0.1587962806224823},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.10352125763893127},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09473243355751038}],"concepts":[{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.8190237283706665},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.684432327747345},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.6127630472183228},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6094229221343994},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5959275364875793},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5778862237930298},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5549983382225037},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.5033463835716248},{"id":"https://openalex.org/C109747225","wikidata":"https://www.wikidata.org/wiki/Q815758","display_name":"Scarcity","level":2,"score":0.4706149697303772},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.4453766644001007},{"id":"https://openalex.org/C55851704","wikidata":"https://www.wikidata.org/wiki/Q7623983","display_name":"String kernel","level":5,"score":0.439485639333725},{"id":"https://openalex.org/C122280245","wikidata":"https://www.wikidata.org/wiki/Q620622","display_name":"Kernel method","level":3,"score":0.345417857170105},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.24312791228294373},{"id":"https://openalex.org/C75866337","wikidata":"https://www.wikidata.org/wiki/Q7280263","display_name":"Radial basis function kernel","level":4,"score":0.1587962806224823},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.10352125763893127},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09473243355751038},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2009916.2010080","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2009916.2010080","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th international ACM SIGIR conference on Research and development in Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.6800000071525574}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":4,"referenced_works":["https://openalex.org/W1524015530","https://openalex.org/W2096082161","https://openalex.org/W2137346077","https://openalex.org/W2166023018"],"related_works":["https://openalex.org/W152351265","https://openalex.org/W3042295250","https://openalex.org/W4319870840","https://openalex.org/W2163203700","https://openalex.org/W4206904133","https://openalex.org/W1986532736","https://openalex.org/W1975708617","https://openalex.org/W2148753920","https://openalex.org/W3013206934","https://openalex.org/W2020816856"],"abstract_inverted_index":{"In":[0,44],"recent":[1],"years,":[2],"a":[3,49],"number":[4],"of":[5,24],"machine":[6,51],"learning":[7,52],"approaches":[8,40],"to":[9,19,37],"literature-based":[10],"gene":[11],"function":[12],"annotation":[13],"have":[14,33],"been":[15,35],"proposed.":[16],"However,":[17],"due":[18],"issues":[20],"such":[21],"as":[22],"lack":[23],"labeled":[25],"data,":[26],"class":[27],"imbalance":[28],"and":[29],"computational":[30],"cost,":[31],"they":[32],"usually":[34],"unable":[36],"surpass":[38],"simpler":[39],"based":[41,54],"on":[42,55],"string-matching.":[43],"this":[45],"paper,":[46],"we":[47],"propose":[48],"principled":[50],"approach":[53],"kernel":[56],"classifiers.":[57]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
