{"id":"https://openalex.org/W4393317613","doi":"https://doi.org/10.3390/a17040144","title":"Aiding ICD-10 Encoding of Clinical Health Records Using Improved Text Cosine Similarity and PLM-ICD","display_name":"Aiding ICD-10 Encoding of Clinical Health Records Using Improved Text Cosine Similarity and PLM-ICD","publication_year":2024,"publication_date":"2024-03-29","ids":{"openalex":"https://openalex.org/W4393317613","doi":"https://doi.org/10.3390/a17040144"},"language":"en","primary_location":{"id":"doi:10.3390/a17040144","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a17040144","pdf_url":"https://www.mdpi.com/1999-4893/17/4/144/pdf?version=1711707561","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/1999-4893/17/4/144/pdf?version=1711707561","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067090259","display_name":"Hugo Silva","orcid":"https://orcid.org/0000-0003-1184-2433"},"institutions":[{"id":"https://openalex.org/I293362453","display_name":"Polytechnic Institute of Coimbra","ror":"https://ror.org/01n8x4993","country_code":"PT","type":"education","lineage":["https://openalex.org/I293362453"]}],"countries":["PT"],"is_corresponding":true,"raw_author_name":"Hugo Silva","raw_affiliation_strings":["Polytechnic Institute of Coimbra, Coimbra Institute of Engineering, Rua Pedro Nunes\u2013Quinta da Nora, 3030-199 Coimbra, Portugal"],"raw_orcid":"https://orcid.org/0000-0003-1184-2433","affiliations":[{"raw_affiliation_string":"Polytechnic Institute of Coimbra, Coimbra Institute of Engineering, Rua Pedro Nunes\u2013Quinta da Nora, 3030-199 Coimbra, Portugal","institution_ids":["https://openalex.org/I293362453"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054376707","display_name":"V\u00edtor Duque","orcid":"https://orcid.org/0000-0003-0000-4004"},"institutions":[{"id":"https://openalex.org/I76903346","display_name":"University of Coimbra","ror":"https://ror.org/04z8k9a98","country_code":"PT","type":"education","lineage":["https://openalex.org/I76903346"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"V\u00edtor Duque","raw_affiliation_strings":["Department of Infectious Diseases, Coimbra Hospital and University Centre, 3000-075 Coimbra, Portugal"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Infectious Diseases, Coimbra Hospital and University Centre, 3000-075 Coimbra, Portugal","institution_ids":["https://openalex.org/I76903346"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043618291","display_name":"M\u00e1rio Macedo","orcid":"https://orcid.org/0000-0002-4145-7301"},"institutions":[{"id":"https://openalex.org/I4210125590","display_name":"Institute for Systems Engineering and Computers","ror":"https://ror.org/033wn8m60","country_code":"PT","type":"nonprofit","lineage":["https://openalex.org/I4210125590"]},{"id":"https://openalex.org/I4405259463","display_name":"Institut des Sciences et technologies pour une Economie Circulaire des \u00e9nergies bas carbone","ror":"https://ror.org/0298wh711","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131","https://openalex.org/I4405259463"]}],"countries":["FR","PT"],"is_corresponding":false,"raw_author_name":"M\u00e1rio Macedo","raw_affiliation_strings":["RCM2+ Research Centre for Asset Management and Systems Engineering, ISEC/IPC, Rua Pedro Nunes, 3030-199 Coimbra, Portugal"],"raw_orcid":"https://orcid.org/0000-0002-4145-7301","affiliations":[{"raw_affiliation_string":"RCM2+ Research Centre for Asset Management and Systems Engineering, ISEC/IPC, Rua Pedro Nunes, 3030-199 Coimbra, Portugal","institution_ids":["https://openalex.org/I4210125590","https://openalex.org/I4405259463"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026269967","display_name":"Mateus Mendes","orcid":"https://orcid.org/0000-0003-4313-7966"},"institutions":[{"id":"https://openalex.org/I293362453","display_name":"Polytechnic Institute of Coimbra","ror":"https://ror.org/01n8x4993","country_code":"PT","type":"education","lineage":["https://openalex.org/I293362453"]}],"countries":["PT"],"is_corresponding":true,"raw_author_name":"Mateus Mendes","raw_affiliation_strings":["Polytechnic Institute of Coimbra, Coimbra Institute of Engineering, Rua Pedro Nunes\u2013Quinta da Nora, 3030-199 Coimbra, Portugal"],"raw_orcid":"https://orcid.org/0000-0003-4313-7966","affiliations":[{"raw_affiliation_string":"Polytechnic Institute of Coimbra, Coimbra Institute of Engineering, Rua Pedro Nunes\u2013Quinta da Nora, 3030-199 Coimbra, Portugal","institution_ids":["https://openalex.org/I293362453"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5026269967","https://openalex.org/A5067090259"],"corresponding_institution_ids":["https://openalex.org/I293362453"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":0.6331,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.66434554,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"17","issue":"4","first_page":"144","last_page":"144"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.7001609206199646},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6514492630958557},{"id":"https://openalex.org/keywords/icd-10","display_name":"ICD-10","score":0.6394894123077393},{"id":"https://openalex.org/keywords/cosine-similarity","display_name":"Cosine similarity","score":0.6063832640647888},{"id":"https://openalex.org/keywords/health-records","display_name":"Health records","score":0.5596776008605957},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5394085645675659},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3860059976577759},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34782740473747253},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.2779850959777832},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.24178755283355713},{"id":"https://openalex.org/keywords/health-care","display_name":"Health care","score":0.07966563105583191}],"concepts":[{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.7001609206199646},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6514492630958557},{"id":"https://openalex.org/C2781116378","wikidata":"https://www.wikidata.org/wiki/Q45127","display_name":"ICD-10","level":2,"score":0.6394894123077393},{"id":"https://openalex.org/C2780762811","wikidata":"https://www.wikidata.org/wiki/Q1784941","display_name":"Cosine similarity","level":3,"score":0.6063832640647888},{"id":"https://openalex.org/C3019952477","wikidata":"https://www.wikidata.org/wiki/Q1324077","display_name":"Health records","level":3,"score":0.5596776008605957},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5394085645675659},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3860059976577759},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34782740473747253},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.2779850959777832},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.24178755283355713},{"id":"https://openalex.org/C160735492","wikidata":"https://www.wikidata.org/wiki/Q31207","display_name":"Health care","level":2,"score":0.07966563105583191},{"id":"https://openalex.org/C118552586","wikidata":"https://www.wikidata.org/wiki/Q7867","display_name":"Psychiatry","level":1,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/a17040144","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a17040144","pdf_url":"https://www.mdpi.com/1999-4893/17/4/144/pdf?version=1711707561","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:943b00aaf73644ff9cff5336867a2f31","is_oa":true,"landing_page_url":"https://doaj.org/article/943b00aaf73644ff9cff5336867a2f31","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Algorithms, Vol 17, Iss 4, p 144 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/a17040144","is_oa":true,"landing_page_url":"https://doi.org/10.3390/a17040144","pdf_url":"https://www.mdpi.com/1999-4893/17/4/144/pdf?version=1711707561","source":{"id":"https://openalex.org/S190629608","display_name":"Algorithms","issn_l":"1999-4893","issn":["1999-4893"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.699999988079071,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G7082142669","display_name":null,"funder_award_id":"022153","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"},{"id":"https://openalex.org/G7991599336","display_name":null,"funder_award_id":"01/SAICT/2016","funder_id":"https://openalex.org/F4320334779","funder_display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia"}],"funders":[{"id":"https://openalex.org/F4320334779","display_name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","ror":"https://ror.org/00snfqn58"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4393317613.pdf"},"referenced_works_count":30,"referenced_works":["https://openalex.org/W2146417320","https://openalex.org/W2177350256","https://openalex.org/W2410696340","https://openalex.org/W2768917383","https://openalex.org/W2911489562","https://openalex.org/W2911842235","https://openalex.org/W2963716420","https://openalex.org/W2964142373","https://openalex.org/W2997050424","https://openalex.org/W3002784191","https://openalex.org/W3035294872","https://openalex.org/W3037562983","https://openalex.org/W3046375318","https://openalex.org/W3093904885","https://openalex.org/W3100452049","https://openalex.org/W3101475827","https://openalex.org/W3103901889","https://openalex.org/W3160596727","https://openalex.org/W3181361218","https://openalex.org/W3198282417","https://openalex.org/W4210603761","https://openalex.org/W4287854971","https://openalex.org/W4313439128","https://openalex.org/W4366835582","https://openalex.org/W4391729322","https://openalex.org/W6758789004","https://openalex.org/W6781031682","https://openalex.org/W6808012567","https://openalex.org/W6810673871","https://openalex.org/W6859363318"],"related_works":["https://openalex.org/W2389818373","https://openalex.org/W2220831889","https://openalex.org/W4312683641","https://openalex.org/W3027421045","https://openalex.org/W2576320324","https://openalex.org/W2980386803","https://openalex.org/W3215994059","https://openalex.org/W2319823519","https://openalex.org/W4206798987","https://openalex.org/W2801158176"],"abstract_inverted_index":{"The":[0,102],"International":[1],"Classification":[2],"of":[3,15,46,84,88,108,130],"Diseases,":[4],"10th":[5],"edition":[6],"(ICD-10),":[7],"has":[8],"been":[9,54],"widely":[10],"used":[11],"for":[12,43,97],"the":[13,44,58,82,93,117,121,128,135,149],"classification":[14,20,38,59],"patient":[16],"diagnostic":[17],"information.":[18],"This":[19,61],"is":[21,33,39,70],"usually":[22],"performed":[23],"by":[24,134],"dedicated":[25],"physicians":[26],"with":[27,72],"specific":[28],"coding":[29],"training,":[30],"and":[31,112,138],"it":[32],"a":[34,40,64,73,106,131],"laborious":[35],"task.":[36],"Automatic":[37],"challenging":[41],"task":[42],"domain":[45],"natural":[47],"language":[48,75],"processing.":[49],"Therefore,":[50],"automatic":[51],"methods":[52],"have":[53],"proposed":[55],"to":[56,80],"aid":[57],"process.":[60],"paper":[62],"proposes":[63],"method":[65,137],"where":[66],"Cosine":[67,118,136],"text":[68],"similarity":[69],"combined":[71],"pretrained":[74],"model,":[76],"PLM-ICD,":[77,139],"in":[78,116],"order":[79],"increase":[81],"number":[83],"probably":[85],"useful":[86,125],"suggestions":[87],"ICD-10":[89],"codes,":[90],"based":[91],"on":[92],"Medical":[94],"Information":[95],"Mart":[96],"Intensive":[98],"Care":[99],"(MIMIC)-IV":[100],"dataset.":[101],"results":[103,146],"show":[104],"that":[105],"strategy":[107,132],"using":[109],"multiple":[110],"runs,":[111],"bucket":[113],"category":[114],"search,":[115],"method,":[119],"improves":[120],"results,":[122],"providing":[123],"more":[124],"suggestions.":[126],"Also,":[127],"use":[129],"composed":[133],"which":[140],"was":[141],"called":[142],"PLM-ICD-C,":[143],"provides":[144],"better":[145],"than":[147],"just":[148],"PLM-ICD.":[150]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
