{"id":"https://openalex.org/W4313525421","doi":"https://doi.org/10.1109/bibm55620.2022.9995448","title":"Comprehensive Assessment of OCR Tools for Gene Name Recognition in Biological Pathway Figures","display_name":"Comprehensive Assessment of OCR Tools for Gene Name Recognition in Biological Pathway Figures","publication_year":2022,"publication_date":"2022-12-06","ids":{"openalex":"https://openalex.org/W4313525421","doi":"https://doi.org/10.1109/bibm55620.2022.9995448"},"language":"en","primary_location":{"id":"doi:10.1109/bibm55620.2022.9995448","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm55620.2022.9995448","pdf_url":null,"source":{"id":"https://openalex.org/S4363607730","display_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048345805","display_name":"Stuart Aldrich","orcid":null},"institutions":[{"id":"https://openalex.org/I76835614","display_name":"University of Missouri","ror":"https://ror.org/02ymw8z06","country_code":"US","type":"education","lineage":["https://openalex.org/I76835614"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Stuart Aldrich","raw_affiliation_strings":["University of Missouri,Department of Electrical Engineering and Computer Science,Columbia,Missouri,USA","Department of Electrical Engineering and Computer Science, University of Missouri, Columbia, Missouri, USA"],"affiliations":[{"raw_affiliation_string":"University of Missouri,Department of Electrical Engineering and Computer Science,Columbia,Missouri,USA","institution_ids":["https://openalex.org/I76835614"]},{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, University of Missouri, Columbia, Missouri, USA","institution_ids":["https://openalex.org/I76835614"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022507170","display_name":"Micheal Olaolu Arowolo","orcid":"https://orcid.org/0000-0002-9418-5346"},"institutions":[{"id":"https://openalex.org/I76835614","display_name":"University of Missouri","ror":"https://ror.org/02ymw8z06","country_code":"US","type":"education","lineage":["https://openalex.org/I76835614"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Micheal Olaolu Arowolo","raw_affiliation_strings":["University of Missouri,Department of Electrical Engineering and Computer Science,Columbia,Missouri,USA","Department of Electrical Engineering and Computer Science, University of Missouri, Columbia, Missouri, USA"],"affiliations":[{"raw_affiliation_string":"University of Missouri,Department of Electrical Engineering and Computer Science,Columbia,Missouri,USA","institution_ids":["https://openalex.org/I76835614"]},{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, University of Missouri, Columbia, Missouri, USA","institution_ids":["https://openalex.org/I76835614"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087149818","display_name":"Fei He","orcid":"https://orcid.org/0000-0002-3284-9506"},"institutions":[{"id":"https://openalex.org/I184983240","display_name":"Northeast Normal University","ror":"https://ror.org/02rkvz144","country_code":"CN","type":"education","lineage":["https://openalex.org/I184983240"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei He","raw_affiliation_strings":["Northeast Normal University,College of Information Science and Technology,Changchun,China","College of Information Science and Technology, Northeast Normal University, Changchun, China"],"affiliations":[{"raw_affiliation_string":"Northeast Normal University,College of Information Science and Technology,Changchun,China","institution_ids":["https://openalex.org/I184983240"]},{"raw_affiliation_string":"College of Information Science and Technology, Northeast Normal University, Changchun, China","institution_ids":["https://openalex.org/I184983240"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060329217","display_name":"Mihail Popescu","orcid":"https://orcid.org/0000-0002-6145-8096"},"institutions":[{"id":"https://openalex.org/I2800649613","display_name":"University of Missouri Health System","ror":"https://ror.org/03yp8z857","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I2800649613"]},{"id":"https://openalex.org/I76835614","display_name":"University of Missouri","ror":"https://ror.org/02ymw8z06","country_code":"US","type":"education","lineage":["https://openalex.org/I76835614"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mihail Popescu","raw_affiliation_strings":["University of Missouri,Department of Health Management and Informatics,Columbia,Missouri,USA","Department of Health Management and Informatics, University of Missouri, Columbia, Missouri, USA"],"affiliations":[{"raw_affiliation_string":"University of Missouri,Department of Health Management and Informatics,Columbia,Missouri,USA","institution_ids":["https://openalex.org/I2800649613"]},{"raw_affiliation_string":"Department of Health Management and Informatics, University of Missouri, Columbia, Missouri, USA","institution_ids":["https://openalex.org/I2800649613","https://openalex.org/I76835614"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5082428303","display_name":"Dong Xu","orcid":"https://orcid.org/0000-0002-4809-0514"},"institutions":[{"id":"https://openalex.org/I76835614","display_name":"University of Missouri","ror":"https://ror.org/02ymw8z06","country_code":"US","type":"education","lineage":["https://openalex.org/I76835614"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dong Xu","raw_affiliation_strings":["University of Missouri,Department of Electrical Engineering and Computer Science,Columbia,Missouri,USA","Department of Electrical Engineering and Computer Science, University of Missouri, Columbia, Missouri, USA"],"affiliations":[{"raw_affiliation_string":"University of Missouri,Department of Electrical Engineering and Computer Science,Columbia,Missouri,USA","institution_ids":["https://openalex.org/I76835614"]},{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, University of Missouri, Columbia, Missouri, USA","institution_ids":["https://openalex.org/I76835614"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5048345805"],"corresponding_institution_ids":["https://openalex.org/I76835614"],"apc_list":null,"apc_paid":null,"fwci":1.3232,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.81962025,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"3574","last_page":"3579"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/alphanumeric","display_name":"Alphanumeric","score":0.885469913482666},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.7425664663314819},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6920349597930908},{"id":"https://openalex.org/keywords/kegg","display_name":"KEGG","score":0.607437789440155},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48533979058265686},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4209803342819214},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.3906075060367584},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.35873275995254517},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.21195024251937866},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.1481437087059021},{"id":"https://openalex.org/keywords/gene-expression","display_name":"Gene expression","score":0.12302884459495544},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.10001063346862793},{"id":"https://openalex.org/keywords/gene-ontology","display_name":"Gene ontology","score":0.07595854997634888}],"concepts":[{"id":"https://openalex.org/C2781003394","wikidata":"https://www.wikidata.org/wiki/Q737372","display_name":"Alphanumeric","level":2,"score":0.885469913482666},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.7425664663314819},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6920349597930908},{"id":"https://openalex.org/C152724338","wikidata":"https://www.wikidata.org/wiki/Q909442","display_name":"KEGG","level":5,"score":0.607437789440155},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48533979058265686},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4209803342819214},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.3906075060367584},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35873275995254517},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.21195024251937866},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.1481437087059021},{"id":"https://openalex.org/C150194340","wikidata":"https://www.wikidata.org/wiki/Q26972","display_name":"Gene expression","level":3,"score":0.12302884459495544},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.10001063346862793},{"id":"https://openalex.org/C2987395477","wikidata":"https://www.wikidata.org/wiki/Q135085","display_name":"Gene ontology","level":4,"score":0.07595854997634888},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bibm55620.2022.9995448","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bibm55620.2022.9995448","pdf_url":null,"source":{"id":"https://openalex.org/S4363607730","display_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.4399999976158142}],"awards":[],"funders":[{"id":"https://openalex.org/F4320338440","display_name":"HORIZON EUROPE Health","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1968738535","https://openalex.org/W2097601945","https://openalex.org/W2102672399","https://openalex.org/W2145819879","https://openalex.org/W2159584465","https://openalex.org/W2160591663","https://openalex.org/W2169279258","https://openalex.org/W2171970585","https://openalex.org/W2506255128","https://openalex.org/W2741809807","https://openalex.org/W2884972436","https://openalex.org/W2969718750","https://openalex.org/W3045882047","https://openalex.org/W3101791085","https://openalex.org/W4205730624","https://openalex.org/W4293218986","https://openalex.org/W4294216483","https://openalex.org/W4307425304","https://openalex.org/W6753222870"],"related_works":["https://openalex.org/W2049379968","https://openalex.org/W4200491602","https://openalex.org/W3210847758","https://openalex.org/W3015507988","https://openalex.org/W3044341113","https://openalex.org/W2956037940","https://openalex.org/W3006692928","https://openalex.org/W4401524754","https://openalex.org/W4385187174","https://openalex.org/W2486949231"],"abstract_inverted_index":{"Optical":[0],"Character":[1],"Recognition":[2],"(OCR)":[3],"is":[4,40],"becoming":[5],"more":[6,8],"and":[7,72,101,119,124,141],"effective":[9],"in":[10,13,18,26,36,45,79,95,150],"text":[11],"detection":[12],"images.":[14,92],"However,":[15],"OCR\u2019s":[16],"performance":[17],"special":[19],"applications":[20],"may":[21],"vary.":[22],"In":[23],"particular,":[24],"OCR":[25,105],"visual":[27],"representations":[28],"of":[29,60,116],"complex":[30],"processes":[31],"known":[32],"as":[33],"pathway":[34,47,61,91,112,130,151],"figures":[35,62],"the":[37,51,57,96],"biomedical":[38],"literature":[39],"challenging.":[41],"The":[42],"information":[43],"depicted":[44],"a":[46,84],"graphic":[48],"usually":[49],"represents":[50],"article\u2019s":[52],"most":[53],"important":[54],"conclusions.":[55],"Still,":[56],"huge":[58],"number":[59],"cannot":[63],"be":[64],"automatically":[65],"processed":[66],"for":[67,146],"large-scale":[68],"search,":[69],"data":[70,126],"mining,":[71],"downstream":[73],"analysis.":[74],"Assisted":[75],"by":[76],"recent":[77],"developments":[78],"OCR,":[80],"we":[81,98],"have":[82],"developed":[83],"method":[85],"to":[86],"extract":[87],"gene":[88,120,147],"names":[89,121],"from":[90,110,122],"For":[93],"usage":[94],"method,":[97],"thoroughly":[99],"evaluated":[100],"compared":[102],"major":[103],"available":[104],"tools":[106],"using":[107],"563":[108],"genes":[109,131],"45":[111],"images,":[113],"1000":[114],"images":[115],"alphanumeric":[117],"characters":[118],"HUGO,":[123],"KEGG":[125],"with":[127],"20":[128],"random":[129],"curated":[132],"routes.":[133],"Our":[134],"study":[135],"showed":[136],"that":[137],"Google":[138],"Cloud":[139],"Vision":[140],"MMOCR":[142],"are":[143],"best":[144],"suitable":[145],"name":[148],"recognition":[149],"figures.":[152]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
