{"id":"https://openalex.org/W7118660496","doi":"https://doi.org/10.1186/s13326-025-00346-1","title":"Annotating and indexing scientific articles with rare diseases","display_name":"Annotating and indexing scientific articles with rare diseases","publication_year":2026,"publication_date":"2026-01-06","ids":{"openalex":"https://openalex.org/W7118660496","doi":"https://doi.org/10.1186/s13326-025-00346-1","pmid":"https://pubmed.ncbi.nlm.nih.gov/41495851"},"language":"en","primary_location":{"id":"doi:10.1186/s13326-025-00346-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13326-025-00346-1","pdf_url":null,"source":{"id":"https://openalex.org/S172276550","display_name":"Journal of Biomedical Semantics","issn_l":"2041-1480","issn":["2041-1480"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Biomedical Semantics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1186/s13326-025-00346-1","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004640276","display_name":"Hosein Azarbonyad","orcid":"https://orcid.org/0000-0003-0841-7516"},"institutions":[{"id":"https://openalex.org/I1318003438","display_name":"RELX Group (Netherlands)","ror":"https://ror.org/02scfj030","country_code":"NL","type":"company","lineage":["https://openalex.org/I1318003438","https://openalex.org/I4210160603"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Hosein Azarbonyad","raw_affiliation_strings":["Elsevier B.V., Amsterdam, Noord Holland, The Netherlands. h.azarbonyad@elsevier.com"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Elsevier B.V., Amsterdam, Noord Holland, The Netherlands. h.azarbonyad@elsevier.com","institution_ids":["https://openalex.org/I1318003438"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048053757","display_name":"Zubair Afzal","orcid":"https://orcid.org/0000-0001-7812-2399"},"institutions":[{"id":"https://openalex.org/I1318003438","display_name":"RELX Group (Netherlands)","ror":"https://ror.org/02scfj030","country_code":"NL","type":"company","lineage":["https://openalex.org/I1318003438","https://openalex.org/I4210160603"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Zubair Afzal","raw_affiliation_strings":["Elsevier B.V., Amsterdam, Noord Holland, The Netherlands"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Elsevier B.V., Amsterdam, Noord Holland, The Netherlands","institution_ids":["https://openalex.org/I1318003438"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122225763","display_name":"Rik Iping","orcid":null},"institutions":[{"id":"https://openalex.org/I2801952686","display_name":"Erasmus MC","ror":"https://ror.org/018906e22","country_code":"NL","type":"funder","lineage":["https://openalex.org/I2801952686"]},{"id":"https://openalex.org/I913958620","display_name":"Erasmus University Rotterdam","ror":"https://ror.org/057w15z03","country_code":"NL","type":"education","lineage":["https://openalex.org/I913958620"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Rik Iping","raw_affiliation_strings":["Erasmus MC, Rotterdam, Zuid Holland, The Netherlands"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Erasmus MC, Rotterdam, Zuid Holland, The Netherlands","institution_ids":["https://openalex.org/I913958620","https://openalex.org/I2801952686"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043767252","display_name":"M. DuMoulin","orcid":null},"institutions":[{"id":"https://openalex.org/I1318003438","display_name":"RELX Group (Netherlands)","ror":"https://ror.org/02scfj030","country_code":"NL","type":"company","lineage":["https://openalex.org/I1318003438","https://openalex.org/I4210160603"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Max Dumoulin","raw_affiliation_strings":["Elsevier B.V., Amsterdam, Noord Holland, The Netherlands"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Elsevier B.V., Amsterdam, Noord Holland, The Netherlands","institution_ids":["https://openalex.org/I1318003438"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122107269","display_name":"Ilse Nederveen","orcid":null},"institutions":[{"id":"https://openalex.org/I2801952686","display_name":"Erasmus MC","ror":"https://ror.org/018906e22","country_code":"NL","type":"funder","lineage":["https://openalex.org/I2801952686"]},{"id":"https://openalex.org/I913958620","display_name":"Erasmus University Rotterdam","ror":"https://ror.org/057w15z03","country_code":"NL","type":"education","lineage":["https://openalex.org/I913958620"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Ilse Nederveen","raw_affiliation_strings":["Erasmus MC, Rotterdam, Zuid Holland, The Netherlands"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Erasmus MC, Rotterdam, Zuid Holland, The Netherlands","institution_ids":["https://openalex.org/I913958620","https://openalex.org/I2801952686"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033442401","display_name":"Jiangtao Yu","orcid":"https://orcid.org/0000-0003-4883-7398"},"institutions":[{"id":"https://openalex.org/I1318003438","display_name":"RELX Group (Netherlands)","ror":"https://ror.org/02scfj030","country_code":"NL","type":"company","lineage":["https://openalex.org/I1318003438","https://openalex.org/I4210160603"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Jiangtao Yu","raw_affiliation_strings":["Elsevier B.V., Amsterdam, Noord Holland, The Netherlands"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Elsevier B.V., Amsterdam, Noord Holland, The Netherlands","institution_ids":["https://openalex.org/I1318003438"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080654893","display_name":"George Tsatsaronis","orcid":"https://orcid.org/0000-0003-2116-2933"},"institutions":[{"id":"https://openalex.org/I1318003438","display_name":"RELX Group (Netherlands)","ror":"https://ror.org/02scfj030","country_code":"NL","type":"company","lineage":["https://openalex.org/I1318003438","https://openalex.org/I4210160603"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Georgios Tsatsaronis","raw_affiliation_strings":["Elsevier B.V., Amsterdam, Noord Holland, The Netherlands"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Elsevier B.V., Amsterdam, Noord Holland, The Netherlands","institution_ids":["https://openalex.org/I1318003438"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5004640276"],"corresponding_institution_ids":["https://openalex.org/I1318003438"],"apc_list":{"value":1190,"currency":"GBP","value_usd":1459},"apc_paid":{"value":1190,"currency":"GBP","value_usd":1459},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.03010965,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"17","issue":"1","first_page":"3","last_page":"3"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9107000231742859,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9107000231742859,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11642","display_name":"Genomics and Rare Diseases","score":0.038600001484155655,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.01549999974668026,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.7623000144958496},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5461000204086304},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5418000221252441},{"id":"https://openalex.org/keywords/operationalization","display_name":"Operationalization","score":0.4885999858379364},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4700999855995178},{"id":"https://openalex.org/keywords/controlled-vocabulary","display_name":"Controlled vocabulary","score":0.37119999527931213},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.3601999878883362}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8744000196456909},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.7623000144958496},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5461000204086304},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5418000221252441},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4943000078201294},{"id":"https://openalex.org/C9354725","wikidata":"https://www.wikidata.org/wiki/Q286017","display_name":"Operationalization","level":2,"score":0.4885999858379364},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4700999855995178},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.46149998903274536},{"id":"https://openalex.org/C110615152","wikidata":"https://www.wikidata.org/wiki/Q1469824","display_name":"Controlled vocabulary","level":2,"score":0.37119999527931213},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.3601999878883362},{"id":"https://openalex.org/C2778828372","wikidata":"https://www.wikidata.org/wiki/Q5283209","display_name":"Distributional semantics","level":3,"score":0.34279999136924744},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.34049999713897705},{"id":"https://openalex.org/C40077939","wikidata":"https://www.wikidata.org/wiki/Q2336004","display_name":"Semi-structured data","level":3,"score":0.310699999332428},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.3018999993801117},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.29030001163482666},{"id":"https://openalex.org/C513874922","wikidata":"https://www.wikidata.org/wiki/Q212805","display_name":"Digital library","level":3,"score":0.2721000015735626},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C96711827","wikidata":"https://www.wikidata.org/wiki/Q17012245","display_name":"Entity linking","level":3,"score":0.26409998536109924},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.2623000144958496},{"id":"https://openalex.org/C2781083858","wikidata":"https://www.wikidata.org/wiki/Q17327049","display_name":"Scientific literature","level":2,"score":0.258899986743927}],"mesh":[{"descriptor_ui":"D000043","descriptor_name":"Abstracting and Indexing","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D000043","descriptor_name":"Abstracting and Indexing","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":true},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012660","descriptor_name":"Semantics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012660","descriptor_name":"Semantics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D035583","descriptor_name":"Rare Diseases","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D035583","descriptor_name":"Rare Diseases","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D066289","descriptor_name":"Data Curation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D066289","descriptor_name":"Data Curation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":5,"locations":[{"id":"doi:10.1186/s13326-025-00346-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13326-025-00346-1","pdf_url":null,"source":{"id":"https://openalex.org/S172276550","display_name":"Journal of Biomedical Semantics","issn_l":"2041-1480","issn":["2041-1480"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Biomedical Semantics","raw_type":"journal-article"},{"id":"pmid:41495851","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41495851","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of biomedical semantics","raw_type":null},{"id":"pmh:oai:pure.eur.nl:openaire/ad9260fc-7b8a-45b0-8587-b32376b8384f","is_oa":true,"landing_page_url":"https://pure.eur.nl/en/publications/ad9260fc-7b8a-45b0-8587-b32376b8384f","pdf_url":null,"source":{"id":"https://openalex.org/S4306401266","display_name":"EUR Research Repository (Erasmus University Rotterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I913958620","host_organization_name":"Erasmus University Rotterdam","host_organization_lineage":["https://openalex.org/I913958620"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Azarbonyad, H, Afzal, Z, Iping, R, Dumoulin, M, Nederveen, I, Yu, J & Tsatsaronis, G 2026, 'Annotating and indexing scientific articles with rare diseases', Journal of Biomedical Semantics, vol. 17, no. 1, 3. https://doi.org/10.1186/s13326-025-00346-1","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:doaj.org/article:cb253687d6014a46b096d1a78b90087f","is_oa":true,"landing_page_url":"https://doaj.org/article/cb253687d6014a46b096d1a78b90087f","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Biomedical Semantics, Vol 17, Iss 1, Pp 1-13 (2026)","raw_type":"article"},{"id":"pmh:oai:europepmc.org:11678154","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/12870340","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/s13326-025-00346-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13326-025-00346-1","pdf_url":null,"source":{"id":"https://openalex.org/S172276550","display_name":"Journal of Biomedical Semantics","issn_l":"2041-1480","issn":["2041-1480"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Biomedical Semantics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1971192989","https://openalex.org/W2085752173","https://openalex.org/W2114315281","https://openalex.org/W2149684865","https://openalex.org/W2152143870","https://openalex.org/W2159583324","https://openalex.org/W2318106356","https://openalex.org/W2562842110","https://openalex.org/W2739996966","https://openalex.org/W2788667846","https://openalex.org/W2911379778","https://openalex.org/W2918540534","https://openalex.org/W2919809473","https://openalex.org/W2929376427","https://openalex.org/W2937423263","https://openalex.org/W2954433047","https://openalex.org/W2963997607","https://openalex.org/W3007517974","https://openalex.org/W3106109117","https://openalex.org/W3156333129","https://openalex.org/W3171416056","https://openalex.org/W3198282417","https://openalex.org/W4385567242","https://openalex.org/W4393160356","https://openalex.org/W4400915868"],"related_works":[],"abstract_inverted_index":{"BACKGROUND:":[0],"Around":[1],"30":[2],"million":[3],"people":[4],"in":[5,20,24,210],"Europe":[6],"are":[7],"affected":[8],"by":[9,71,114],"a":[10,17,42,48,105],"rare":[11,44,61,93,202,228],"(or":[12],"orphan)":[13],"disease,":[14],"defined":[15],"as":[16],"condition":[18],"occurring":[19],"fewer":[21],"than":[22],"1":[23],"2,000":[25],"individuals.":[26],"The":[27],"primary":[28],"challenge":[29],"is":[30,69,191],"to":[31,51,154],"automatically":[32],"and":[33,38,53,86,89,128,143,162,168,182,200,215,219,230,235],"efficiently":[34],"identify":[35],"scientific":[36,55],"articles":[37],"guidelines":[39],"that":[40,107],"address":[41],"particular":[43],"disease.":[45],"We":[46,103],"present":[47],"novel":[49],"methodology":[50],"annotate":[52],"index":[54],"text":[56],"with":[57,119],"taxonomical":[58],"concepts":[59],"describing":[60],"diseases":[62,229],"from":[63],"the":[64,76,87,116,134,152,174,192,222,238],"OrphaNet":[65,109,209],"taxonomy.":[66],"This":[67],"task":[68],"complicated":[70],"several":[72],"technical":[73],"challenges,":[74],"including":[75],"lack":[77],"of":[78,92],"sufficiently":[79],"large,":[80],"human-annotated":[81],"datasets":[82],"for":[83,110,160,179,198,227],"supervised":[84],"training":[85],"polysemy/synonymy":[88],"surface-form":[90],"variation":[91],"disease":[94,203],"names,":[95],"which":[96],"can":[97],"hinder":[98],"any":[99],"annotation":[100,113],"engine.":[101],"RESULTS:":[102],"introduce":[104],"framework":[106,197],"operationalizes":[108],"large-scale":[111],"literature":[112,204],"integrating":[115],"TERMite":[117],"engine":[118],"curated":[120],"synonym":[121],"expansion,":[122],"label":[123],"normalization":[124],"(including":[125],"deprecated/renamed":[126],"concepts),":[127],"fuzzy":[129],"matching.":[130],"On":[131],"benchmark":[132],"datasets,":[133],"approach":[135],"achieves":[136],"precision":[137],"=":[138,141,145],"92%,":[139],"recall":[140],"75%,":[142],"F1":[144],"83%,":[146],"outperforming":[147],"an":[148,211],"string-matching":[149],"baseline.":[150],"Applying":[151],"pipeline":[153,214],"Scopus":[155],"produces":[156],"disease-specific":[157],"corpora":[158],"suitable":[159],"bibliometric":[161],"scientometric":[163],"analyses":[164],"(e.g.,":[165],"institution,":[166],"country,":[167],"subject-area":[169],"profiles).":[170],"These":[171],"outputs":[172],"power":[173],"Rare":[175],"Diseases":[176],"Monitor":[177],"dashboard":[178],"exploring":[180],"national":[181],"global":[183],"research":[184,239],"activity.":[185],"CONCLUSION:":[186],"To":[187],"our":[188],"knowledge,":[189],"this":[190],"first":[193],"systematic,":[194],"scalable":[195],"semantic":[196],"annotating":[199],"indexing":[201],"at":[205],"scale.":[206],"By":[207],"operationalizing":[208],"automated,":[212],"reproducible":[213],"addressing":[216],"data":[217],"scarcity":[218],"lexical":[220],"variability,":[221],"work":[223],"advances":[224],"biomedical":[225],"semantics":[226],"enables":[231],"disease-centric":[232],"monitoring,":[233],"evaluation,":[234],"discovery":[236],"across":[237],"landscape.":[240]},"counts_by_year":[],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2026-01-08T00:00:00"}
