{"id":"https://openalex.org/W4220815098","doi":"https://doi.org/10.1109/tcbb.2022.3157630","title":"Noise Reduction Learning Based on XLNet-CRF for Biomedical Named Entity Recognition","display_name":"Noise Reduction Learning Based on XLNet-CRF for Biomedical Named Entity Recognition","publication_year":2022,"publication_date":"2022-03-08","ids":{"openalex":"https://openalex.org/W4220815098","doi":"https://doi.org/10.1109/tcbb.2022.3157630","pmid":"https://pubmed.ncbi.nlm.nih.gov/35259113"},"language":"en","primary_location":{"id":"doi:10.1109/tcbb.2022.3157630","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcbb.2022.3157630","pdf_url":null,"source":{"id":"https://openalex.org/S36029991","display_name":"IEEE/ACM Transactions on Computational Biology and Bioinformatics","issn_l":"1545-5963","issn":["1545-5963","1557-9964","2374-0043"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Computational Biology and Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Zhaoying Chai","orcid":"https://orcid.org/0000-0003-3131-1285"},"institutions":[{"id":"https://openalex.org/I75390827","display_name":"Beijing University of Chemical Technology","ror":"https://ror.org/00df5yc52","country_code":"CN","type":"education","lineage":["https://openalex.org/I75390827"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhaoying Chai","raw_affiliation_strings":["College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China","institution_ids":["https://openalex.org/I75390827"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Han Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I75390827","display_name":"Beijing University of Chemical Technology","ror":"https://ror.org/00df5yc52","country_code":"CN","type":"education","lineage":["https://openalex.org/I75390827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Han Jin","raw_affiliation_strings":["College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China","institution_ids":["https://openalex.org/I75390827"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Shenghui Shi","orcid":"https://orcid.org/0000-0001-5746-3012"},"institutions":[{"id":"https://openalex.org/I75390827","display_name":"Beijing University of Chemical Technology","ror":"https://ror.org/00df5yc52","country_code":"CN","type":"education","lineage":["https://openalex.org/I75390827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shenghui Shi","raw_affiliation_strings":["College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Technology, Beijing University of Chemical Technology, Beijing, China","institution_ids":["https://openalex.org/I75390827"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Siyan Zhan","orcid":"https://orcid.org/0000-0001-7252-5349"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siyan Zhan","raw_affiliation_strings":["School of Public Health, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Public Health, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Lin Zhuo","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210141942","display_name":"Peking University Third Hospital","ror":"https://ror.org/04wwqze12","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210141942"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Zhuo","raw_affiliation_strings":["Research Center of Clinical Epidemiology, Peking University Third Hospital, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Research Center of Clinical Epidemiology, Peking University Third Hospital, Beijing, China","institution_ids":["https://openalex.org/I20231570","https://openalex.org/I4210141942"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yu Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210096250","display_name":"Beijing Institute of Big Data Research","ror":"https://ror.org/00s1sz824","country_code":"CN","type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I37796252","https://openalex.org/I4210096250"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu Yang","raw_affiliation_strings":["National institute of health data science, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National institute of health data science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570","https://openalex.org/I4210096250"]}]},{"author_position":"last","author":{"id":null,"display_name":"Qi Lian","orcid":null},"institutions":[{"id":"https://openalex.org/I165143802","display_name":"University of Queensland","ror":"https://ror.org/00rqy9422","country_code":"AU","type":"education","lineage":["https://openalex.org/I165143802"]},{"id":"https://openalex.org/I160993911","display_name":"Queensland University of Technology","ror":"https://ror.org/03pnv4752","country_code":"AU","type":"education","lineage":["https://openalex.org/I160993911"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Qi Lian","raw_affiliation_strings":["Information Technology and Electrical Engineering, The University of Queensland, Brisbane, Australia"],"affiliations":[{"raw_affiliation_string":"Information Technology and Electrical Engineering, The University of Queensland, Brisbane, Australia","institution_ids":["https://openalex.org/I160993911","https://openalex.org/I165143802"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I75390827"],"apc_list":null,"apc_paid":null,"fwci":1.5163,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.84867385,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"20","issue":"1","first_page":"595","last_page":"605"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.711899995803833,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.711899995803833,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.18199999630451202,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.024299999698996544,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/named-entity-recognition","display_name":"Named-entity recognition","score":0.722000002861023},{"id":"https://openalex.org/keywords/conditional-random-field","display_name":"Conditional random field","score":0.6728000044822693},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.5554999709129333},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4796999990940094},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4564000070095062},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4311999976634979},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4090999960899353},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4043000042438507},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.4034999907016754}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7879999876022339},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.722000002861023},{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.6728000044822693},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6086999773979187},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.5554999709129333},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4796999990940094},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.460099995136261},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4564000070095062},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4311999976634979},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4090999960899353},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4043000042438507},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.4034999907016754},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.38929998874664307},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3531000018119812},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3504999876022339},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.33959999680519104},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3382999897003174},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.33570000529289246},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.3321000039577484},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.31310001015663147},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.3095000088214874},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.29120001196861267},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.2879999876022339},{"id":"https://openalex.org/C21308566","wikidata":"https://www.wikidata.org/wiki/Q7169365","display_name":"Permutation (music)","level":2,"score":0.27950000762939453},{"id":"https://openalex.org/C150921843","wikidata":"https://www.wikidata.org/wiki/Q1170431","display_name":"Resampling","level":2,"score":0.27619999647140503},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.27399998903274536},{"id":"https://openalex.org/C2781170535","wikidata":"https://www.wikidata.org/wiki/Q30587856","display_name":"Noisy data","level":2,"score":0.2712000012397766},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.2648000121116638},{"id":"https://openalex.org/C200985842","wikidata":"https://www.wikidata.org/wiki/Q3375503","display_name":"Random permutation","level":3,"score":0.2644999921321869}],"mesh":[{"descriptor_ui":"D007802","descriptor_name":"Language","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D007802","descriptor_name":"Language","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D007802","descriptor_name":"Language","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1109/tcbb.2022.3157630","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcbb.2022.3157630","pdf_url":null,"source":{"id":"https://openalex.org/S36029991","display_name":"IEEE/ACM Transactions on Computational Biology and Bioinformatics","issn_l":"1545-5963","issn":["1545-5963","1557-9964","2374-0043"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Computational Biology and Bioinformatics","raw_type":"journal-article"},{"id":"pmid:35259113","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35259113","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM transactions on computational biology and bioinformatics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W1964670939","https://openalex.org/W2047782770","https://openalex.org/W2057974478","https://openalex.org/W2100627415","https://openalex.org/W2145386458","https://openalex.org/W2149369282","https://openalex.org/W2154142897","https://openalex.org/W2161853863","https://openalex.org/W2169099542","https://openalex.org/W2176996276","https://openalex.org/W2283140239","https://openalex.org/W2296283641","https://openalex.org/W2346452181","https://openalex.org/W2537623931","https://openalex.org/W2734608416","https://openalex.org/W2743028754","https://openalex.org/W2768488789","https://openalex.org/W2769387903","https://openalex.org/W2779457220","https://openalex.org/W2889607075","https://openalex.org/W2890830728","https://openalex.org/W2896457183","https://openalex.org/W2911489562","https://openalex.org/W2963250244","https://openalex.org/W2963339489","https://openalex.org/W2995602767","https://openalex.org/W3004047707","https://openalex.org/W3024305464","https://openalex.org/W3043710593","https://openalex.org/W3048238778","https://openalex.org/W3090469165","https://openalex.org/W3097717858","https://openalex.org/W3107083523","https://openalex.org/W3157876196","https://openalex.org/W3161231563","https://openalex.org/W3175873000","https://openalex.org/W3186054896","https://openalex.org/W6604173257","https://openalex.org/W6727690538","https://openalex.org/W6736175030","https://openalex.org/W6739901393","https://openalex.org/W6763701032","https://openalex.org/W6767434342"],"related_works":[],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"Biomedical":[3],"Named":[4],"Entity":[5],"Recognition":[6],"(BioNER)":[7],"systems":[8],"have":[9,37,68],"mainly":[10],"been":[11,39],"based":[12,34,91],"on":[13,35,92,134],"deep":[14],"neural":[15],"networks,":[16],"which":[17,95],"are":[18],"used":[19],"to":[20,165],"extract":[21],"information":[22],"from":[23],"the":[24,51,117,121,141,144,148,151,158,162],"rapidly":[25],"expanding":[26],"biomedical":[27,112],"literature.":[28],"Long-distance":[29],"context":[30],"autoencoding":[31],"language":[32,99],"models":[33,67,119,146,163],"transformers":[36],"recently":[38],"employed":[40],"for":[41,63,75],"BioNER":[42],"with":[43],"great":[44],"success.":[45],"However,":[46],"noise":[47,83],"interference":[48],"exists":[49],"in":[50,71],"process":[52],"of":[53,73,82,136,143,150,154,161],"pre-training":[54,100],"and":[55,57,88,102,126,129,147,156],"fine-tuning,":[56],"there":[58],"is":[59,96],"no":[60],"effective":[61],"decoder":[62],"label":[64],"dependency.":[65],"Current":[66],"many":[69],"aspects":[70],"need":[72],"improvement":[74,149],"better":[76],"performance.":[77],"We":[78],"propose":[79],"two":[80,118,145],"kinds":[81],"reduction":[84],"models,":[85],"Shared":[86],"Labels":[87],"Dynamic":[89],"Splicing,":[90],"XLNet":[93],"encoding":[94],"a":[97],"permutation":[98],"model":[101],"decoding":[103],"by":[104,124],"Conditional":[105],"Random":[106],"Field":[107],"(CRF).":[108],"By":[109],"testing":[110],"15":[111],"named":[113],"entity":[114],"recognition":[115,152],"datasets,":[116],"improved":[120],"average":[122],"F1-score":[123],"1.504":[125],"1.48,":[127],"respectively,":[128],"state-of-the-art":[130],"performance":[131],"was":[132],"achieved":[133],"7":[135],"them.":[137],"Further":[138],"analysis":[139],"proves":[140],"effectiveness":[142],"effect":[153],"CRF,":[155],"suggests":[157],"applicable":[159],"scope":[160],"according":[164],"different":[166],"data":[167],"characteristics.":[168]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":7}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2022-04-03T00:00:00"}
