{"id":"https://openalex.org/W2017675085","doi":"https://doi.org/10.1145/2665970.2665990","title":"Biomedical Named Entity Recognition Based on the Combination of Regional and Global Text Features","display_name":"Biomedical Named Entity Recognition Based on the Combination of Regional and Global Text Features","publication_year":2014,"publication_date":"2014-11-03","ids":{"openalex":"https://openalex.org/W2017675085","doi":"https://doi.org/10.1145/2665970.2665990","mag":"2017675085"},"language":"en","primary_location":{"id":"doi:10.1145/2665970.2665990","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2665970.2665990","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM 8th International Workshop on Data and Text Mining in Bioinformatics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029511687","display_name":"Yoo Kyung Jeong","orcid":"https://orcid.org/0000-0002-6571-6478"},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yoo Kyung Jeong","raw_affiliation_strings":["Department of Library and Information Science, Yonsei University, Seoul, South Korea","(Department of Library and Information Science, Yonsei University, Seoul, South Korea)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Library and Information Science, Yonsei University, Seoul, South Korea","institution_ids":["https://openalex.org/I193775966"]},{"raw_affiliation_string":"(Department of Library and Information Science, Yonsei University, Seoul, South Korea)","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109475683","display_name":"Da-Hee Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Dahee Lee","raw_affiliation_strings":["Department of Library and Information Science, Yonsei University, Seoul, South Korea","(Department of Library and Information Science, Yonsei University, Seoul, South Korea)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Library and Information Science, Yonsei University, Seoul, South Korea","institution_ids":["https://openalex.org/I193775966"]},{"raw_affiliation_string":"(Department of Library and Information Science, Yonsei University, Seoul, South Korea)","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087793573","display_name":"Namgi Han","orcid":null},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Nam-Gi Han","raw_affiliation_strings":["Department of Library and Information Science, Yonsei University, Seoul, South Korea","(Department of Library and Information Science, Yonsei University, Seoul, South Korea)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Library and Information Science, Yonsei University, Seoul, South Korea","institution_ids":["https://openalex.org/I193775966"]},{"raw_affiliation_string":"(Department of Library and Information Science, Yonsei University, Seoul, South Korea)","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047395571","display_name":"Won Chul Kim","orcid":"https://orcid.org/0000-0002-5925-6647"},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Won Chul Kim","raw_affiliation_strings":["Department of Library and Information Science, Yonsei University, Seoul, South Korea","(Department of Library and Information Science, Yonsei University, Seoul, South Korea)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Library and Information Science, Yonsei University, Seoul, South Korea","institution_ids":["https://openalex.org/I193775966"]},{"raw_affiliation_string":"(Department of Library and Information Science, Yonsei University, Seoul, South Korea)","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045749444","display_name":"Min Song","orcid":"https://orcid.org/0000-0003-3255-1600"},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Min Song","raw_affiliation_strings":["Department of Library and Information Science, Yonsei University, Seoul, South Korea","(Department of Library and Information Science, Yonsei University, Seoul, South Korea)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Library and Information Science, Yonsei University, Seoul, South Korea","institution_ids":["https://openalex.org/I193775966"]},{"raw_affiliation_string":"(Department of Library and Information Science, Yonsei University, Seoul, South Korea)","institution_ids":["https://openalex.org/I193775966"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0780842,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"5","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/conditional-random-field","display_name":"Conditional random field","score":0.870207667350769},{"id":"https://openalex.org/keywords/named-entity-recognition","display_name":"Named-entity recognition","score":0.8664629459381104},{"id":"https://openalex.org/keywords/biomedical-text-mining","display_name":"Biomedical text mining","score":0.8152894973754883},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.813388466835022},{"id":"https://openalex.org/keywords/crfs","display_name":"CRFS","score":0.8003394603729248},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.7380618453025818},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7120914459228516},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7109789848327637},{"id":"https://openalex.org/keywords/entity-linking","display_name":"Entity linking","score":0.6193215250968933},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.5504924058914185},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5279989242553711},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4920057952404022},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4767005145549774},{"id":"https://openalex.org/keywords/feature-engineering","display_name":"Feature engineering","score":0.4480922818183899},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4407499134540558},{"id":"https://openalex.org/keywords/pipeline-transport","display_name":"Pipeline transport","score":0.43186846375465393},{"id":"https://openalex.org/keywords/text-mining","display_name":"Text mining","score":0.33949971199035645},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.2632777690887451},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.2141985297203064},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.13442927598953247},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08336472511291504}],"concepts":[{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.870207667350769},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.8664629459381104},{"id":"https://openalex.org/C165141518","wikidata":"https://www.wikidata.org/wiki/Q4915126","display_name":"Biomedical text mining","level":3,"score":0.8152894973754883},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.813388466835022},{"id":"https://openalex.org/C2775953691","wikidata":"https://www.wikidata.org/wiki/Q5013874","display_name":"CRFS","level":3,"score":0.8003394603729248},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.7380618453025818},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7120914459228516},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7109789848327637},{"id":"https://openalex.org/C96711827","wikidata":"https://www.wikidata.org/wiki/Q17012245","display_name":"Entity linking","level":3,"score":0.6193215250968933},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.5504924058914185},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5279989242553711},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4920057952404022},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4767005145549774},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.4480922818183899},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4407499134540558},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.43186846375465393},{"id":"https://openalex.org/C71472368","wikidata":"https://www.wikidata.org/wiki/Q676880","display_name":"Text mining","level":2,"score":0.33949971199035645},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2632777690887451},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.2141985297203064},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.13442927598953247},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08336472511291504},{"id":"https://openalex.org/C87717796","wikidata":"https://www.wikidata.org/wiki/Q146326","display_name":"Environmental engineering","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2665970.2665990","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2665970.2665990","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM 8th International Workshop on Data and Text Mining in Bioinformatics","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6200000047683716,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G6889220993","display_name":null,"funder_award_id":"NRF-2013M3A9C4078138","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":2,"referenced_works":["https://openalex.org/W2048140075","https://openalex.org/W2147880316"],"related_works":["https://openalex.org/W2763026339","https://openalex.org/W2548624545","https://openalex.org/W2067424770","https://openalex.org/W189110383","https://openalex.org/W2398073356","https://openalex.org/W3087842898","https://openalex.org/W2027233318","https://openalex.org/W4250494529","https://openalex.org/W3185751515","https://openalex.org/W2937192905"],"abstract_inverted_index":{"The":[0],"biomedical":[1,14,25,47,163],"information":[2],"extraction,":[3],"especially":[4,88],"Named":[5],"Entity":[6],"Recognition":[7],"(NER),":[8],"is":[9],"a":[10,45,51,74,99,124,137],"primary":[11],"task":[12],"in":[13,98,117],"text-mining":[15],"due":[16],"to":[17,130,148,160,187],"the":[18,92,114,118,156,188,191],"rapid":[19],"growth":[20],"of":[21,53,80,127,133,139,150,190],"large-scale":[22],"literature.":[23],"Extracting":[24],"entities":[26,31],"aims":[27],"at":[28],"identifying":[29],"specific":[30],"(words":[32],"or":[33],"phrases)":[34],"from":[35,145],"those":[36],"unstructured":[37],"text":[38,57,96],"data.":[39],"In":[40],"this":[41],"work,":[42],"we":[43],"introduce":[44],"novel":[46],"NER":[48,164],"system":[49,66,122,143],"utilizing":[50],"combination":[52],"regional":[54],"and":[55,62,78,102,110,183],"global":[56],"features:":[58],"linguistic,":[59],"lexical,":[60],"contextual,":[61],"syntactic":[63],"features.":[64],"Our":[65],"adopts":[67],"Conditional":[68],"Random":[69],"Fields":[70],"(CRFs)":[71],"[1]":[72],"as":[73,153,155,177],"machine":[75],"learning":[76],"algorithm":[77],"consists":[79],"two":[81],"major":[82],"pipelines":[83],"(see":[84],"Figure":[85],"1).":[86],"We":[87,170],"focus":[89],"on":[90,166],"constructing":[91],"first":[93],"pipeline":[94],"for":[95],"processing":[97],"modularized":[100],"manner":[101],"discovering":[103],"rich":[104],"feature":[105,134,184],"sets":[106],"regarding":[107],"comprehensive":[108],"linguistics":[109],"contexts.":[111],"To":[112],"implement":[113],"CRF":[115],"framework":[116],"second":[119],"pipeline,":[120],"our":[121,142],"uses":[123],"modified":[125],"version":[126],"Mallet":[128],"[2]":[129],"take":[131],"advantage":[132],"induction.":[135],"As":[136],"result":[138],"10-fold":[140],"cross-validation,":[141],"achieves":[144],"0.99%":[146],"up":[147],"18.47%":[149],"F-measure":[151],"improvement":[152],"well":[154],"highest":[157],"precision":[158],"compared":[159],"existing":[161],"open-source":[162],"systems":[165],"GENETAG":[167],"corpus":[168],"[3].":[169],"figure":[171],"out":[172],"that":[173],"several":[174],"components":[175],"such":[176],"abundant":[178],"key":[179],"features,":[180],"external":[181],"resources,":[182],"induction":[185],"contribute":[186],"performance":[189],"proposed":[192],"system.":[193]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
