{"id":"https://openalex.org/W4400679085","doi":"https://doi.org/10.1109/tcbb.2024.3429234","title":"Enhancing Generalizability in Biomedical Entity Recognition: Self-Attention PCA-CLS Model","display_name":"Enhancing Generalizability in Biomedical Entity Recognition: Self-Attention PCA-CLS Model","publication_year":2024,"publication_date":"2024-07-16","ids":{"openalex":"https://openalex.org/W4400679085","doi":"https://doi.org/10.1109/tcbb.2024.3429234","pmid":"https://pubmed.ncbi.nlm.nih.gov/39012749"},"language":"en","primary_location":{"id":"doi:10.1109/tcbb.2024.3429234","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcbb.2024.3429234","pdf_url":null,"source":{"id":"https://openalex.org/S36029991","display_name":"IEEE/ACM Transactions on Computational Biology and Bioinformatics","issn_l":"1545-5963","issn":["1545-5963","1557-9964","2374-0043"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Computational Biology and Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003314662","display_name":"Rajesh Kumar Mundotiya","orcid":"https://orcid.org/0000-0002-0096-2440"},"institutions":[{"id":"https://openalex.org/I4210121466","display_name":"Indian Institute of Technology Bhilai","ror":"https://ror.org/02sscsx71","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210121466"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Rajesh Kumar Mundotiya","raw_affiliation_strings":["Department of Computer Science &#x0026; Engineering, Indian Institute of Technology Bhilai, Bhilai, Chhattisgarh, India","Department of Computer Science &amp; Engineering, Indian Institute of Technology Bhilai, India"],"raw_orcid":"https://orcid.org/0000-0002-0096-2440","affiliations":[{"raw_affiliation_string":"Department of Computer Science &#x0026; Engineering, Indian Institute of Technology Bhilai, Bhilai, Chhattisgarh, India","institution_ids":["https://openalex.org/I4210121466"]},{"raw_affiliation_string":"Department of Computer Science &amp; Engineering, Indian Institute of Technology Bhilai, India","institution_ids":["https://openalex.org/I4210121466"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113241020","display_name":"J. Likhitha Priya","orcid":null},"institutions":[{"id":"https://openalex.org/I1310439424","display_name":"Accenture (Switzerland)","ror":"https://ror.org/041r3e346","country_code":"CH","type":"company","lineage":["https://openalex.org/I1310439424","https://openalex.org/I4210093804"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Juhi Priya","raw_affiliation_strings":["Accenture-ATCI, SEZ, Bangalore, Karnataka, India","Accenture-ATCI, SEZ, Bangalore, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Accenture-ATCI, SEZ, Bangalore, Karnataka, India","institution_ids":["https://openalex.org/I1310439424"]},{"raw_affiliation_string":"Accenture-ATCI, SEZ, Bangalore, India","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104601348","display_name":"Divya Kuwarbi","orcid":null},"institutions":[{"id":"https://openalex.org/I1343973766","display_name":"Acxiom (United States)","ror":"https://ror.org/00pv14226","country_code":"US","type":"company","lineage":["https://openalex.org/I1343973766"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Divya Kuwarbi","raw_affiliation_strings":["Acxiom Technologies, Mumbai, Maharashtra, India","Acxiom Technologies, Rustomjee Central Park, Andheri East, Mumbai, India"],"raw_orcid":"https://orcid.org/0009-0003-5234-9802","affiliations":[{"raw_affiliation_string":"Acxiom Technologies, Mumbai, Maharashtra, India","institution_ids":["https://openalex.org/I1343973766"]},{"raw_affiliation_string":"Acxiom Technologies, Rustomjee Central Park, Andheri East, Mumbai, India","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102879014","display_name":"Teekam Singh","orcid":"https://orcid.org/0000-0003-4819-9402"},"institutions":[{"id":"https://openalex.org/I60054993","display_name":"Graphic Era University","ror":"https://ror.org/03wqgqd89","country_code":"IN","type":"education","lineage":["https://openalex.org/I60054993"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Teekam Singh","raw_affiliation_strings":["Department of Computer Science and Engineering, Graphic Era Deemed to be University Dehradun, Dehradun, Uttarakhand, India","Department of Computer Science and Engineering, Graphic Era Deemed to be University Dehradun, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Graphic Era Deemed to be University Dehradun, Dehradun, Uttarakhand, India","institution_ids":["https://openalex.org/I60054993"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, Graphic Era Deemed to be University Dehradun, India","institution_ids":["https://openalex.org/I60054993"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5003314662"],"corresponding_institution_ids":["https://openalex.org/I4210121466"],"apc_list":null,"apc_paid":null,"fwci":0.6531,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.73621887,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"21","issue":"6","first_page":"1934","last_page":"1941"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9419000148773193,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9419000148773193,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9027000069618225,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalizability-theory","display_name":"Generalizability theory","score":0.8744029998779297},{"id":"https://openalex.org/keywords/cls-upper-limits","display_name":"CLs upper limits","score":0.7274085283279419},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.43046462535858154},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.3842490315437317},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.35405588150024414},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3255699872970581},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.25475332140922546},{"id":"https://openalex.org/keywords/developmental-psychology","display_name":"Developmental psychology","score":0.10018622875213623}],"concepts":[{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.8744029998779297},{"id":"https://openalex.org/C190729725","wikidata":"https://www.wikidata.org/wiki/Q5012817","display_name":"CLs upper limits","level":2,"score":0.7274085283279419},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.43046462535858154},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3842490315437317},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35405588150024414},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3255699872970581},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.25475332140922546},{"id":"https://openalex.org/C138496976","wikidata":"https://www.wikidata.org/wiki/Q175002","display_name":"Developmental psychology","level":1,"score":0.10018622875213623},{"id":"https://openalex.org/C119767625","wikidata":"https://www.wikidata.org/wiki/Q618211","display_name":"Optometry","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000098415","descriptor_name":"Convolutional Neural Networks","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000098415","descriptor_name":"Convolutional Neural Networks","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000098415","descriptor_name":"Convolutional Neural Networks","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009323","descriptor_name":"Natural Language Processing","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D009323","descriptor_name":"Natural Language Processing","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D009323","descriptor_name":"Natural Language Processing","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D009323","descriptor_name":"Natural Language Processing","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009323","descriptor_name":"Natural Language Processing","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012660","descriptor_name":"Semantics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012660","descriptor_name":"Semantics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D035843","descriptor_name":"Biomedical Research","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D035843","descriptor_name":"Biomedical Research","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D035843","descriptor_name":"Biomedical Research","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D057225","descriptor_name":"Data Mining","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D057225","descriptor_name":"Data Mining","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D057225","descriptor_name":"Data Mining","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D057225","descriptor_name":"Data Mining","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D057225","descriptor_name":"Data Mining","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D066264","descriptor_name":"Datasets as Topic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D066264","descriptor_name":"Datasets as Topic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D066264","descriptor_name":"Datasets as Topic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1109/tcbb.2024.3429234","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcbb.2024.3429234","pdf_url":null,"source":{"id":"https://openalex.org/S36029991","display_name":"IEEE/ACM Transactions on Computational Biology and Bioinformatics","issn_l":"1545-5963","issn":["1545-5963","1557-9964","2374-0043"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Computational Biology and Bioinformatics","raw_type":"journal-article"},{"id":"pmid:39012749","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/39012749","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM transactions on computational biology and bioinformatics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W2047782770","https://openalex.org/W2057974478","https://openalex.org/W2071879021","https://openalex.org/W2095444228","https://openalex.org/W2100627415","https://openalex.org/W2149369282","https://openalex.org/W2154142897","https://openalex.org/W2159580878","https://openalex.org/W2163107094","https://openalex.org/W2169099542","https://openalex.org/W2346452181","https://openalex.org/W2399851972","https://openalex.org/W2769387903","https://openalex.org/W2779457220","https://openalex.org/W2889607075","https://openalex.org/W2911489562","https://openalex.org/W2938568946","https://openalex.org/W2948614377","https://openalex.org/W2949176808","https://openalex.org/W2950021574","https://openalex.org/W2952744660","https://openalex.org/W2964054038","https://openalex.org/W2970771982","https://openalex.org/W3034732033","https://openalex.org/W3037063616","https://openalex.org/W3046375318","https://openalex.org/W3048238778","https://openalex.org/W3083429640","https://openalex.org/W3090469165","https://openalex.org/W3104578551","https://openalex.org/W3125468681","https://openalex.org/W3137401156","https://openalex.org/W3166593409","https://openalex.org/W3207942231","https://openalex.org/W4210504333","https://openalex.org/W6748743896"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2118717649","https://openalex.org/W2413243053","https://openalex.org/W410723623","https://openalex.org/W2015341305","https://openalex.org/W2035068594","https://openalex.org/W4225593417","https://openalex.org/W2033914206","https://openalex.org/W2042327336"],"abstract_inverted_index":{"One":[0],"of":[1,9,15],"the":[2,6,13,82,152],"primary":[3],"tasks":[4],"in":[5,60,79],"early":[7],"stages":[8],"data":[10,34],"mining":[11],"involves":[12],"identification":[14],"entities":[16,112],"from":[17,31,71],"biomedical":[18,80,108],"corpora.":[19],"Traditional":[20],"approaches":[21],"relying":[22],"on":[23,105,132,135,138,141,144,147,151],"robust":[24],"feature":[25],"engineering":[26],"face":[27],"challenges":[28,78],"when":[29],"learning":[30,49],"available":[32],"(un-)annotated":[33],"using":[35],"data-driven":[36],"models":[37],"like":[38],"deep":[39,48],"learning-based":[40],"architectures.":[41],"Despite":[42],"leveraging":[43],"large":[44],"corpora":[45],"and":[46,65,68,85,94,118,149],"advanced":[47],"models,":[50,126],"domain":[51,109],"generalization":[52],"remains":[53],"an":[54],"issue.":[55],"Attention":[56,87],"mechanisms":[57],"are":[58],"effective":[59],"capturing":[61],"longer":[62],"sentence":[63],"dependencies":[64],"extracting":[66],"semantic":[67],"syntactic":[69],"information":[70],"limited":[72],"annotated":[73],"datasets.":[74],"To":[75],"address":[76],"out-of-vocabulary":[77],"text,":[81],"PCA-CLS":[83,121],"(Position":[84],"Contextual":[86],"with":[88],"CNN-LSTM-Softmax)":[89],"model":[90,122],"combines":[91],"global":[92],"self-attention":[93],"character-level":[95],"convolutional":[96],"neural":[97],"network":[98],"techniques.":[99],"The":[100,120],"model's":[101],"performance":[102],"is":[103],"evaluated":[104],"eight":[106],"distinct":[107],"datasets":[110],"encompassing":[111],"such":[113],"as":[114],"genes,":[115],"drugs,":[116],"diseases,":[117],"species.":[119],"outperforms":[123],"several":[124],"state-of-the-art":[125],"achieving":[127],"notable":[128],"F-scores,":[129],"including":[130],"88.19%":[131],"BC2GM,":[133],"85.44%":[134],"JNLPBA,":[136],"90.80%":[137],"BC5CDR-chemical,":[139],"87.07%":[140],"BC5CDR-disease,":[142],"89.18%":[143],"BC4CHEMD,":[145],"88.81%":[146],"NCBI,":[148],"91.59%":[150],"s800":[153],"dataset.":[154]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
