{"id":"https://openalex.org/W3081664523","doi":"https://doi.org/10.2478/jdis-2021-0013","title":"Automatic Keyphrase Extraction from Scientific Chinese Medical Abstracts Based on Character-Level Sequence Labeling","display_name":"Automatic Keyphrase Extraction from Scientific Chinese Medical Abstracts Based on Character-Level Sequence Labeling","publication_year":2021,"publication_date":"2021-03-02","ids":{"openalex":"https://openalex.org/W3081664523","doi":"https://doi.org/10.2478/jdis-2021-0013","mag":"3081664523"},"language":"en","primary_location":{"id":"doi:10.2478/jdis-2021-0013","is_oa":true,"landing_page_url":"https://doi.org/10.2478/jdis-2021-0013","pdf_url":"https://sciendo.com/pdf/10.2478/jdis-2021-0013","source":{"id":"https://openalex.org/S2764801193","display_name":"Journal of Data and Information Science","issn_l":"2096-157X","issn":["2096-157X","2543-683X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311940","host_organization_name":"Chinese Academy of Sciences","host_organization_lineage":["https://openalex.org/P4310311940"],"host_organization_lineage_names":["Chinese Academy of Sciences"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Data and Information Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://sciendo.com/pdf/10.2478/jdis-2021-0013","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068494448","display_name":"Liangping Ding","orcid":"https://orcid.org/0000-0001-6832-4114"},"institutions":[{"id":"https://openalex.org/I4210148850","display_name":"National Science Library","ror":"https://ror.org/04ndjyr10","country_code":"CN","type":"archive","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210148850"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Liangping Ding","raw_affiliation_strings":["National Science Library, Chinese Academy of Sciences , Beijing , China","University of Chinese academy of sciences , Beijing , China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Science Library, Chinese Academy of Sciences , Beijing , China","institution_ids":["https://openalex.org/I4210148850"]},{"raw_affiliation_string":"University of Chinese academy of sciences , Beijing , China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101598836","display_name":"Zhixiong Zhang","orcid":"https://orcid.org/0000-0003-1596-7487"},"institutions":[{"id":"https://openalex.org/I4210148850","display_name":"National Science Library","ror":"https://ror.org/04ndjyr10","country_code":"CN","type":"archive","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210148850"]},{"id":"https://openalex.org/I4210134970","display_name":"Wuhan Branch of the National Science Library","ror":"https://ror.org/046n0zq43","country_code":"CN","type":"archive","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210134970","https://openalex.org/I4210148850"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhixiong Zhang","raw_affiliation_strings":["National Science Library, Chinese Academy of Sciences , Beijing , China","University of Chinese academy of sciences , Beijing , China","Wuhan Library, Chinese Academy of Sciences , Wuhan , China"],"affiliations":[{"raw_affiliation_string":"National Science Library, Chinese Academy of Sciences , Beijing , China","institution_ids":["https://openalex.org/I4210148850"]},{"raw_affiliation_string":"University of Chinese academy of sciences , Beijing , China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Wuhan Library, Chinese Academy of Sciences , Wuhan , China","institution_ids":["https://openalex.org/I4210134970"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100338872","display_name":"Huan Liu","orcid":"https://orcid.org/0000-0001-5929-4400"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210148850","display_name":"National Science Library","ror":"https://ror.org/04ndjyr10","country_code":"CN","type":"archive","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210148850"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huan Liu","raw_affiliation_strings":["National Science Library, Chinese Academy of Sciences , Beijing , China","University of Chinese academy of sciences , Beijing , China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Science Library, Chinese Academy of Sciences , Beijing , China","institution_ids":["https://openalex.org/I4210148850"]},{"raw_affiliation_string":"University of Chinese academy of sciences , Beijing , China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100428364","display_name":"Jie Li","orcid":"https://orcid.org/0009-0003-0046-5596"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210148850","display_name":"National Science Library","ror":"https://ror.org/04ndjyr10","country_code":"CN","type":"archive","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210148850"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Li","raw_affiliation_strings":["National Science Library, Chinese Academy of Sciences , Beijing , China","University of Chinese academy of sciences , Beijing , China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Science Library, Chinese Academy of Sciences , Beijing , China","institution_ids":["https://openalex.org/I4210148850"]},{"raw_affiliation_string":"University of Chinese academy of sciences , Beijing , China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056564450","display_name":"Gaihong Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210148850","display_name":"National Science Library","ror":"https://ror.org/04ndjyr10","country_code":"CN","type":"archive","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210148850"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gaihong Yu","raw_affiliation_strings":["National Science Library, Chinese Academy of Sciences , Beijing , China","University of Chinese academy of sciences , Beijing , China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Science Library, Chinese Academy of Sciences , Beijing , China","institution_ids":["https://openalex.org/I4210148850"]},{"raw_affiliation_string":"University of Chinese academy of sciences , Beijing , China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5068494448"],"corresponding_institution_ids":["https://openalex.org/I4210148850","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.136,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.50008688,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":93},"biblio":{"volume":"6","issue":"3","first_page":"35","last_page":"57"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.7250033617019653},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6690764427185059},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.5715146064758301},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5576140880584717},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5197774767875671},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.4002227187156677},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.16076555848121643},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.08753606677055359},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.07892420887947083},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.07636821269989014}],"concepts":[{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.7250033617019653},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6690764427185059},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.5715146064758301},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5576140880584717},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5197774767875671},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.4002227187156677},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.16076555848121643},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.08753606677055359},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.07892420887947083},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.07636821269989014},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.2478/jdis-2021-0013","is_oa":true,"landing_page_url":"https://doi.org/10.2478/jdis-2021-0013","pdf_url":"https://sciendo.com/pdf/10.2478/jdis-2021-0013","source":{"id":"https://openalex.org/S2764801193","display_name":"Journal of Data and Information Science","issn_l":"2096-157X","issn":["2096-157X","2543-683X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311940","host_organization_name":"Chinese Academy of Sciences","host_organization_lineage":["https://openalex.org/P4310311940"],"host_organization_lineage_names":["Chinese Academy of Sciences"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Data and Information Science","raw_type":"journal-article"},{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/77a3134a-c895-430a-9d4c-fd6b1f56a3e0","is_oa":true,"landing_page_url":"https://research.manchester.ac.uk/en/publications/77a3134a-c895-430a-9d4c-fd6b1f56a3e0","pdf_url":null,"source":{"id":"https://openalex.org/S4306400662","display_name":"Research Explorer (The University of Manchester)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I28407311","host_organization_name":"University of Manchester","host_organization_lineage":["https://openalex.org/I28407311"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Ding, L, Zhang, Z, Liu, H, Li, J & Yu, G 2021, 'Automatic Keyphrase Extraction from Scientific Chinese Medical Abstracts Based on Character-Level Sequence Labeling', Journal of Data and Information Science, vol. 6, no. 3, pp. 35-57. https://doi.org/10.2478/jdis-2021-0013","raw_type":"article"},{"id":"mag:3081664523","is_oa":false,"landing_page_url":"http://ceur-ws.org/Vol-2658/paper3.pdf","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":null}],"best_oa_location":{"id":"doi:10.2478/jdis-2021-0013","is_oa":true,"landing_page_url":"https://doi.org/10.2478/jdis-2021-0013","pdf_url":"https://sciendo.com/pdf/10.2478/jdis-2021-0013","source":{"id":"https://openalex.org/S2764801193","display_name":"Journal of Data and Information Science","issn_l":"2096-157X","issn":["2096-157X","2543-683X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311940","host_organization_name":"Chinese Academy of Sciences","host_organization_lineage":["https://openalex.org/P4310311940"],"host_organization_lineage_names":["Chinese Academy of Sciences"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Data and Information Science","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321133","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3081664523.pdf","grobid_xml":"https://content.openalex.org/works/W3081664523.grobid-xml"},"referenced_works_count":55,"referenced_works":["https://openalex.org/W32253530","https://openalex.org/W1479777983","https://openalex.org/W1544240449","https://openalex.org/W1907578970","https://openalex.org/W1971947061","https://openalex.org/W1975432235","https://openalex.org/W1978394996","https://openalex.org/W1985697096","https://openalex.org/W2011399892","https://openalex.org/W2030903088","https://openalex.org/W2045181608","https://openalex.org/W2058089741","https://openalex.org/W2061118645","https://openalex.org/W2064418625","https://openalex.org/W2071940869","https://openalex.org/W2102733276","https://openalex.org/W2105745072","https://openalex.org/W2110693578","https://openalex.org/W2110798204","https://openalex.org/W2136075087","https://openalex.org/W2136922672","https://openalex.org/W2141222516","https://openalex.org/W2145049651","https://openalex.org/W2145766604","https://openalex.org/W2158018156","https://openalex.org/W2163659824","https://openalex.org/W2167329753","https://openalex.org/W2250589143","https://openalex.org/W2250954789","https://openalex.org/W2251295945","https://openalex.org/W2251476947","https://openalex.org/W2525778437","https://openalex.org/W2526059794","https://openalex.org/W2559152380","https://openalex.org/W2566480286","https://openalex.org/W2734608416","https://openalex.org/W2789995212","https://openalex.org/W2896457183","https://openalex.org/W2911489562","https://openalex.org/W2949176808","https://openalex.org/W2962739339","https://openalex.org/W2962903510","https://openalex.org/W2963026768","https://openalex.org/W2963339489","https://openalex.org/W3010180081","https://openalex.org/W3015316465","https://openalex.org/W4255165398","https://openalex.org/W6601685744","https://openalex.org/W6631501603","https://openalex.org/W6638437678","https://openalex.org/W6639689704","https://openalex.org/W6685063089","https://openalex.org/W6685158001","https://openalex.org/W6739901393","https://openalex.org/W6762088049"],"related_works":["https://openalex.org/W3136166618","https://openalex.org/W1571048958","https://openalex.org/W2407602213","https://openalex.org/W2175961425","https://openalex.org/W2579421788","https://openalex.org/W2775202391","https://openalex.org/W2991906656","https://openalex.org/W2568161442","https://openalex.org/W2501258963","https://openalex.org/W3135010642","https://openalex.org/W2159746967","https://openalex.org/W3033005197","https://openalex.org/W3080344931","https://openalex.org/W31525886","https://openalex.org/W2578248109","https://openalex.org/W2541677038","https://openalex.org/W2915224552","https://openalex.org/W2030903088","https://openalex.org/W2842548026","https://openalex.org/W2807440203"],"abstract_inverted_index":{"Abstract":[0],"Purpose":[1],"Automatic":[2,250],"keyphrase":[3,39,119,205,210,290,320],"extraction":[4,40,120,206,291,321],"(AKE)":[5],"is":[6,231,268,284],"an":[7,37],"important":[8],"task":[9,58,207,292],"for":[10,42,234,261,287,309],"grasping":[11],"the":[12,16,25,173,220,262,294,315],"main":[13],"points":[14],"of":[15,27,63,180,193,248,264,297,317],"text.":[17],"In":[18,226],"this":[19],"paper,":[20],"we":[21],"aim":[22],"to":[23,35,59,152,322],"combine":[24],"benefits":[26,263],"sequence":[28,56,157,184],"labeling":[29,57,158,185],"formulation":[30,283],"and":[31,66,90,110,128,145,155,165,312],"pretrained":[32,71,298],"language":[33,72,299],"model":[34,41,69,73,176,186,310],"propose":[36],"automatic":[38,204,289,319],"Chinese":[43,51,64,86,249,255,288,318],"scientific":[44,254],"research.":[45],"Design/methodology/approach":[46],"We":[47,82,116,201,241],"regard":[48],"AKE":[49],"from":[50,85,95,253],"text":[52,222],"as":[53,102,107,113,147],"a":[54,92,306],"character-level":[55,156,171,183,244,282],"avoid":[60],"segmentation":[61],"errors":[62],"tokenizer":[65],"initialize":[67],"our":[68,182,228,243,278,302],"with":[70,170,177,236],"BERT,":[74],"which":[75,98,267],"was":[76],"released":[77],"by":[78],"Google":[79],"in":[80,219],"2018.":[81],"collect":[83],"data":[84],"Science":[87],"Citation":[88],"Database":[89],"construct":[91],"large-scale":[93],"dataset":[94,230,247,304],"medical":[96,256],"domain,":[97],"contains":[99],"100,000":[100],"abstracts":[101,106,112,257],"training":[103],"set,":[104],"6,000":[105],"development":[108,316],"set":[109],"3,094":[111],"test":[114],"set.":[115],"use":[117],"unsupervised":[118],"methods":[121,132],"including":[122,133],"term":[123],"frequency":[124],"(TF),":[125],"TF-IDF,":[126],"TextRank":[127],"supervised":[129,161],"machine":[130,162],"learning":[131,163],"Conditional":[134],"Random":[135],"Field":[136],"(CRF),":[137],"Bidirectional":[138],"Long":[139],"Short":[140],"Term":[141],"Memory":[142],"Network":[143],"(BiLSTM),":[144],"BiLSTM-CRF":[146],"baselines.":[148],"Experiments":[149],"are":[150,217],"designed":[151],"compare":[153],"word-level":[154],"approaches":[159],"on":[160,188],"models":[164],"BERT-based":[166],"models.":[167,300],"Findings":[168],"Compared":[169],"BiLSTM-CRF,":[172],"best":[174],"baseline":[175],"F1":[178,191],"score":[179,192],"50.16%,":[181],"based":[187],"BERT":[189],"obtains":[190],"59.80%,":[194],"getting":[195],"9.64%":[196],"absolute":[197],"improvement.":[198],"Research":[199],"limitations":[200],"just":[202],"consider":[203],"rather":[208],"than":[209],"generation":[211],"task,":[212],"so":[213],"only":[214],"keyphrases":[215],"that":[216,281],"occurred":[218],"given":[221],"can":[223,313],"be":[224],"extracted.":[225],"addition,":[227],"proposed":[229,303],"not":[232],"suitable":[233,286],"dealing":[235],"nested":[237],"keyphrases.":[238],"Practical":[239],"implications":[240],"make":[242],"IOB":[245],"format":[246],"Keyphrase":[251],"Extraction":[252],"(CAKE)":[258],"publicly":[259],"available":[260,269],"research":[265],"community,":[266],"at:":[270],"https://github.com/possible1402/Dataset-For-Chinese-Medical-Keyphrase-Extraction":[271],".":[272],"Originality/value":[273],"By":[274],"designing":[275],"comparative":[276],"experiments,":[277],"study":[279],"demonstrates":[280],"more":[285],"under":[293],"general":[295],"trend":[296],"And":[301],"provides":[305],"unified":[307],"method":[308],"evaluation":[311],"promote":[314],"some":[323],"extent.":[324]},"counts_by_year":[{"year":2021,"cited_by_count":1}],"updated_date":"2026-01-23T23:20:30.427331","created_date":"2025-10-10T00:00:00"}
