{"id":"https://openalex.org/W7116748712","doi":"https://doi.org/10.1109/access.2025.3646756","title":"HeaRT: An Innovative Health Representation Transformer With Clustered Feature Augmentation for Biomedical Text Classification","display_name":"HeaRT: An Innovative Health Representation Transformer With Clustered Feature Augmentation for Biomedical Text Classification","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W7116748712","doi":"https://doi.org/10.1109/access.2025.3646756"},"language":null,"primary_location":{"id":"doi:10.1109/access.2025.3646756","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3646756","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3646756","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120963289","display_name":"Merve Pinar","orcid":null},"institutions":[{"id":"https://openalex.org/I44457188","display_name":"Maltepe University","ror":"https://ror.org/004dg2369","country_code":"TR","type":"education","lineage":["https://openalex.org/I44457188"]},{"id":"https://openalex.org/I74897591","display_name":"Marmara University","ror":"https://ror.org/02kswqa67","country_code":"TR","type":"education","lineage":["https://openalex.org/I74897591"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Merve Pinar","raw_affiliation_strings":["Department of Computer Engineering, Faculty of Technology, Marmara University, Maltepe, \u0130stanbul, T&#x00FC;rkiye"],"raw_orcid":"https://orcid.org/0000-0003-3041-6958","affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Faculty of Technology, Marmara University, Maltepe, \u0130stanbul, T&#x00FC;rkiye","institution_ids":["https://openalex.org/I44457188","https://openalex.org/I74897591"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120947944","display_name":"Ayse Berna Altinel","orcid":null},"institutions":[{"id":"https://openalex.org/I44457188","display_name":"Maltepe University","ror":"https://ror.org/004dg2369","country_code":"TR","type":"education","lineage":["https://openalex.org/I44457188"]},{"id":"https://openalex.org/I74897591","display_name":"Marmara University","ror":"https://ror.org/02kswqa67","country_code":"TR","type":"education","lineage":["https://openalex.org/I74897591"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Ayse Berna Altinel","raw_affiliation_strings":["Department of Computer Engineering, Faculty of Technology, Marmara University, Maltepe, \u0130stanbul, T&#x00FC;rkiye"],"raw_orcid":"https://orcid.org/0000-0001-5544-0925","affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Faculty of Technology, Marmara University, Maltepe, \u0130stanbul, T&#x00FC;rkiye","institution_ids":["https://openalex.org/I44457188","https://openalex.org/I74897591"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079918798","display_name":"Abdulsamet Akta\u015f","orcid":"https://orcid.org/0000-0003-0746-7693"},"institutions":[{"id":"https://openalex.org/I44457188","display_name":"Maltepe University","ror":"https://ror.org/004dg2369","country_code":"TR","type":"education","lineage":["https://openalex.org/I44457188"]},{"id":"https://openalex.org/I74897591","display_name":"Marmara University","ror":"https://ror.org/02kswqa67","country_code":"TR","type":"education","lineage":["https://openalex.org/I74897591"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Abdulsamet Aktas","raw_affiliation_strings":["Department of Computer Engineering, Faculty of Technology, Marmara University, Maltepe, \u0130stanbul, T&#x00FC;rkiye"],"raw_orcid":"https://orcid.org/0000-0003-0746-7693","affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Faculty of Technology, Marmara University, Maltepe, \u0130stanbul, T&#x00FC;rkiye","institution_ids":["https://openalex.org/I44457188","https://openalex.org/I74897591"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5120963289"],"corresponding_institution_ids":["https://openalex.org/I44457188","https://openalex.org/I74897591"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.79610877,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"13","issue":null,"first_page":"215748","last_page":"215770"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.41780000925064087,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.41780000925064087,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.18690000474452972,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.13920000195503235,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.4893999993801117},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.47609999775886536},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.426800012588501},{"id":"https://openalex.org/keywords/health-informatics","display_name":"Health informatics","score":0.42579999566078186},{"id":"https://openalex.org/keywords/medical-classification","display_name":"Medical classification","score":0.40529999136924744},{"id":"https://openalex.org/keywords/unified-medical-language-system","display_name":"Unified Medical Language System","score":0.37310001254081726},{"id":"https://openalex.org/keywords/clinical-decision-support-system","display_name":"Clinical decision support system","score":0.3610999882221222},{"id":"https://openalex.org/keywords/adaboost","display_name":"AdaBoost","score":0.3513000011444092},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.3441999852657318}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7943000197410583},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6567000150680542},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.4893999993801117},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.47609999775886536},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4507000148296356},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.426800012588501},{"id":"https://openalex.org/C145642194","wikidata":"https://www.wikidata.org/wiki/Q870895","display_name":"Health informatics","level":3,"score":0.42579999566078186},{"id":"https://openalex.org/C154874363","wikidata":"https://www.wikidata.org/wiki/Q3518464","display_name":"Medical classification","level":2,"score":0.40529999136924744},{"id":"https://openalex.org/C69505689","wikidata":"https://www.wikidata.org/wiki/Q455338","display_name":"Unified Medical Language System","level":2,"score":0.37310001254081726},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.36820000410079956},{"id":"https://openalex.org/C63527458","wikidata":"https://www.wikidata.org/wiki/Q5133829","display_name":"Clinical decision support system","level":3,"score":0.3610999882221222},{"id":"https://openalex.org/C141404830","wikidata":"https://www.wikidata.org/wiki/Q2823869","display_name":"AdaBoost","level":3,"score":0.3513000011444092},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3441999852657318},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.3400000035762787},{"id":"https://openalex.org/C66782513","wikidata":"https://www.wikidata.org/wiki/Q864601","display_name":"Biomedicine","level":2,"score":0.3255000114440918},{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.3239000141620636},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.32330000400543213},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3181999921798706},{"id":"https://openalex.org/C534262118","wikidata":"https://www.wikidata.org/wiki/Q177719","display_name":"Medical diagnosis","level":2,"score":0.30559998750686646},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.3052000105381012},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.29170000553131104},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.28220000863075256},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.28029999136924744},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.2775999903678894},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2721000015735626},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.26759999990463257},{"id":"https://openalex.org/C71472368","wikidata":"https://www.wikidata.org/wiki/Q676880","display_name":"Text mining","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.25519999861717224},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.2542000114917755},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.2517000138759613}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/access.2025.3646756","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3646756","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3646756","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3646756","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.45692333579063416,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":61,"referenced_works":["https://openalex.org/W1881830221","https://openalex.org/W1970187450","https://openalex.org/W1972794504","https://openalex.org/W2011430131","https://openalex.org/W2049017883","https://openalex.org/W2056132907","https://openalex.org/W2088794999","https://openalex.org/W2091825929","https://openalex.org/W2140321362","https://openalex.org/W2185735639","https://openalex.org/W2216946510","https://openalex.org/W2330219538","https://openalex.org/W2609923048","https://openalex.org/W2623340684","https://openalex.org/W2772121968","https://openalex.org/W2896457183","https://openalex.org/W2911489562","https://openalex.org/W2912097622","https://openalex.org/W2927032858","https://openalex.org/W2927746189","https://openalex.org/W2941323306","https://openalex.org/W2965373594","https://openalex.org/W2970641574","https://openalex.org/W2999191191","https://openalex.org/W3004382610","https://openalex.org/W3005971956","https://openalex.org/W3021618059","https://openalex.org/W3037016244","https://openalex.org/W3135832423","https://openalex.org/W3170382704","https://openalex.org/W3201908633","https://openalex.org/W4221110957","https://openalex.org/W4251372957","https://openalex.org/W4283593236","https://openalex.org/W4283715676","https://openalex.org/W4283785590","https://openalex.org/W4283791631","https://openalex.org/W4296079469","https://openalex.org/W4299687112","https://openalex.org/W4303983263","https://openalex.org/W4308866759","https://openalex.org/W4310522573","https://openalex.org/W4322012984","https://openalex.org/W4327566711","https://openalex.org/W4362589072","https://openalex.org/W4363650638","https://openalex.org/W4365129631","https://openalex.org/W4382201643","https://openalex.org/W4389485036","https://openalex.org/W4391454432","https://openalex.org/W4391892062","https://openalex.org/W4394711871","https://openalex.org/W4399110344","https://openalex.org/W4399647672","https://openalex.org/W4399727970","https://openalex.org/W4400762160","https://openalex.org/W4402540481","https://openalex.org/W4402747738","https://openalex.org/W4404450987","https://openalex.org/W4404628842","https://openalex.org/W4409885654"],"related_works":[],"abstract_inverted_index":{"Medical":[0,141,172],"text":[1,209],"classification":[2,33],"(MTC)":[3],"poses":[4],"significant":[5],"challenges":[6],"in":[7,216],"health":[8],"informatics":[9,225],"due":[10],"to":[11,55,84,103],"contextual":[12,62,89],"complexity,":[13],"class":[14],"imbalance,":[15],"and":[16,31,39,64,88,99,106,119,143,148,157,174,204,223],"limited":[17],"labeled":[18,38],"data.":[19],"This":[20],"study":[21,54],"introduces":[22],"<italic":[23],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[24],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">HeaRT":[25],"(Health":[26],"Representation":[27],"Transformer)</i>,":[28],"a":[29,69,201],"novel":[30],"explainable":[32],"framework":[34,134],"tailored":[35],"for":[36,74,207,214],"sparsely":[37],"semantically":[40],"complex":[41],"medical":[42,208],"texts.":[43],"To":[44,109],"the":[45,52,129,144,179,187],"best":[46],"of":[47,167,190],"our":[48],"knowledge,":[49],"this":[50],"is":[51,101,135,149],"first":[53],"systematically":[56],"combine":[57],"TF-based":[58,78],"lexical":[59,79,87],"weighting,":[60],"SBERT":[61,82],"embeddings,":[63],"cluster-enhanced":[65],"structural":[66],"features":[67,115],"within":[68],"unified":[70],"multi-vector":[71],"fusion":[72],"architecture":[73],"MTC.":[75],"HeaRT":[76,163,199],"combines":[77],"weighting":[80],"with":[81,169,176,211],"embeddings":[83],"capture":[85],"both":[86],"nuances.":[90],"A":[91],"hybrid":[92],"feature":[93],"selection":[94],"mechanism":[95],"based":[96],"on":[97,137,171,178],"ANOVA":[98],"SHAP":[100],"employed":[102],"reduce":[104],"redundancy":[105],"improve":[107],"interpretability.":[108],"further":[110],"enhance":[111],"representational":[112],"capacity,":[113],"cluster-derived":[114],"from":[116],"K-means,":[117],"DBSCAN,":[118],"Agglomerative":[120],"Clustering":[121],"are":[122],"added,":[123],"introducing":[124],"topological":[125],"structure":[126],"awareness":[127],"into":[128],"learning":[130],"process.":[131],"The":[132],"proposed":[133],"evaluated":[136],"two":[138],"benchmark":[139],"datasets:":[140],"Abstracts":[142,173],"Biomedical":[145,180],"Text":[146,181],"Dataset,":[147],"compared":[150],"against":[151],"state-of-the-art":[152],"models":[153],"such":[154],"as":[155,200],"BERT,":[156],"Doc2Sequence.":[158],"Experimental":[159],"results":[160,185],"reveal":[161],"that":[162],"achieves":[164],"an":[165],"F1-score":[166],"60.74%":[168],"AdaBoost":[170],"94.02%":[175],"LightGBM":[177],"Dataset.":[182],"Paired":[183],"t-test":[184],"confirm":[186],"statistical":[188],"significance":[189],"these":[191],"gains":[192],"(p":[193],"<":[194],"0.05).":[195],"These":[196],"findings":[197],"establish":[198],"robust,":[202],"interpretable,":[203],"extensible":[205],"solution":[206],"classification,":[210],"strong":[212],"potential":[213],"deployment":[215],"clinical":[217],"decision":[218],"support,":[219],"biomedical":[220],"literature":[221],"mining,":[222],"healthcare":[224],"applications.":[226]},"counts_by_year":[],"updated_date":"2025-12-30T23:08:21.542490","created_date":"2025-12-22T00:00:00"}
