{"id":"https://openalex.org/W4393932132","doi":"https://doi.org/10.1186/s40537-024-00903-y","title":"Adapting transformer-based language models for heart disease detection and risk factors extraction","display_name":"Adapting transformer-based language models for heart disease detection and risk factors extraction","publication_year":2024,"publication_date":"2024-04-04","ids":{"openalex":"https://openalex.org/W4393932132","doi":"https://doi.org/10.1186/s40537-024-00903-y"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-024-00903-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-024-00903-y","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-00903-y","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-00903-y","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056436780","display_name":"Essam H. Houssein","orcid":"https://orcid.org/0000-0002-8127-7233"},"institutions":[{"id":"https://openalex.org/I89466785","display_name":"Minia University","ror":"https://ror.org/02hcv4z63","country_code":"EG","type":"education","lineage":["https://openalex.org/I89466785"]}],"countries":["EG"],"is_corresponding":true,"raw_author_name":"Essam H. Houssein","raw_affiliation_strings":["Faculty of Computers and Information, Minia University, Minia, Egypt"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Computers and Information, Minia University, Minia, Egypt","institution_ids":["https://openalex.org/I89466785"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076970771","display_name":"Rehab E. Mohamed","orcid":null},"institutions":[{"id":"https://openalex.org/I89466785","display_name":"Minia University","ror":"https://ror.org/02hcv4z63","country_code":"EG","type":"education","lineage":["https://openalex.org/I89466785"]}],"countries":["EG"],"is_corresponding":false,"raw_author_name":"Rehab E. Mohamed","raw_affiliation_strings":["Faculty of Computers and Information, Minia University, Minia, Egypt"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Computers and Information, Minia University, Minia, Egypt","institution_ids":["https://openalex.org/I89466785"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101617943","display_name":"Guang Hu","orcid":"https://orcid.org/0000-0002-8754-1541"},"institutions":[{"id":"https://openalex.org/I4210131919","display_name":"Xi'an University of Technology","ror":"https://ror.org/038avdt50","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210131919"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gang Hu","raw_affiliation_strings":["Department of Applied Mathematics, Xi\u2019an University of Technology, Xi\u2019an, 710054, China","Department of Applied Mathematics, Xi'an University of Technology, Xi'an, 710054, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Applied Mathematics, Xi\u2019an University of Technology, Xi\u2019an, 710054, China","institution_ids":["https://openalex.org/I4210131919"]},{"raw_affiliation_string":"Department of Applied Mathematics, Xi'an University of Technology, Xi'an, 710054, China","institution_ids":["https://openalex.org/I4210131919"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5114334565","display_name":"Abdelmgeid A. Ali","orcid":null},"institutions":[{"id":"https://openalex.org/I89466785","display_name":"Minia University","ror":"https://ror.org/02hcv4z63","country_code":"EG","type":"education","lineage":["https://openalex.org/I89466785"]}],"countries":["EG"],"is_corresponding":false,"raw_author_name":"Abdelmgeid A. Ali","raw_affiliation_strings":["Faculty of Computers and Information, Minia University, Minia, Egypt"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Computers and Information, Minia University, Minia, Egypt","institution_ids":["https://openalex.org/I89466785"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5056436780"],"corresponding_institution_ids":["https://openalex.org/I89466785"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":13.1312,"has_fulltext":true,"cited_by_count":21,"citation_normalized_percentile":{"value":0.98497744,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"11","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11396","display_name":"Artificial Intelligence in Healthcare","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/3605","display_name":"Health Information Management"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9904999732971191,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9735999703407288,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.797360897064209},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5321003198623657},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39060136675834656},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3608967661857605},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.36052292585372925}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.797360897064209},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5321003198623657},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39060136675834656},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3608967661857605},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.36052292585372925},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s40537-024-00903-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-024-00903-y","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-00903-y","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:5bbe9433fe8b441db9a0fcb0dd504179","is_oa":false,"landing_page_url":"https://doaj.org/article/5bbe9433fe8b441db9a0fcb0dd504179","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Big Data, Vol 11, Iss 1, Pp 1-27 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-024-00903-y","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-024-00903-y","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-00903-y","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Good health and well-being","score":0.5699999928474426,"id":"https://metadata.un.org/sdg/3"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321655","display_name":"Science and Technology Development Fund","ror":"https://ror.org/044vr6g03"},{"id":"https://openalex.org/F4320327648","display_name":"Minia University","ror":"https://ror.org/02hcv4z63"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4393932132.pdf"},"referenced_works_count":67,"referenced_works":["https://openalex.org/W283797413","https://openalex.org/W833343209","https://openalex.org/W942379102","https://openalex.org/W1019512417","https://openalex.org/W1034019924","https://openalex.org/W1081873870","https://openalex.org/W1126062418","https://openalex.org/W1451372127","https://openalex.org/W1614298861","https://openalex.org/W1656216251","https://openalex.org/W1737136247","https://openalex.org/W1964625659","https://openalex.org/W2114039834","https://openalex.org/W2114388055","https://openalex.org/W2123442489","https://openalex.org/W2124972954","https://openalex.org/W2133990480","https://openalex.org/W2139521168","https://openalex.org/W2151477381","https://openalex.org/W2153635508","https://openalex.org/W2159636537","https://openalex.org/W2165698076","https://openalex.org/W2168924589","https://openalex.org/W2187005605","https://openalex.org/W2396881363","https://openalex.org/W2493916176","https://openalex.org/W2547728652","https://openalex.org/W2768092558","https://openalex.org/W2885828205","https://openalex.org/W2889877784","https://openalex.org/W2893364991","https://openalex.org/W2899736836","https://openalex.org/W2911489562","https://openalex.org/W2912042784","https://openalex.org/W2913705661","https://openalex.org/W2923014074","https://openalex.org/W2939470209","https://openalex.org/W2944400536","https://openalex.org/W2950813464","https://openalex.org/W2963354094","https://openalex.org/W2963626623","https://openalex.org/W2963716420","https://openalex.org/W2970771982","https://openalex.org/W2971258845","https://openalex.org/W2971668428","https://openalex.org/W2972984751","https://openalex.org/W2981852735","https://openalex.org/W2985884876","https://openalex.org/W3003943678","https://openalex.org/W3004227146","https://openalex.org/W3007060302","https://openalex.org/W3025578374","https://openalex.org/W3034328552","https://openalex.org/W3035204084","https://openalex.org/W3035375600","https://openalex.org/W3048989076","https://openalex.org/W3100452049","https://openalex.org/W3105063288","https://openalex.org/W3111112601","https://openalex.org/W3122886537","https://openalex.org/W3124523525","https://openalex.org/W3177034450","https://openalex.org/W3198196226","https://openalex.org/W4214644841","https://openalex.org/W4226269719","https://openalex.org/W4241818541","https://openalex.org/W6800751262"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W3046775127","https://openalex.org/W3107602296","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4283697347","https://openalex.org/W4210805261"],"abstract_inverted_index":{"Abstract":[0],"Efficiently":[1],"treating":[2],"cardiac":[3],"patients":[4],"before":[5],"the":[6,14,23,126,162,203,214,241,261,276,291,300,326,335,353],"onset":[7],"of":[8,17,128,154,174,185,278,297,314,325,348,355],"a":[9,100,106,182,322,345],"heart":[10,18,27,91,119,149,199,230,279,340,370],"attack":[11],"relies":[12],"on":[13,170],"precise":[15],"prediction":[16,364],"disease.":[19],"Identifying":[20],"and":[21,44,52,146,152,177,211,235,258,304,318,365],"detecting":[22],"risk":[24,68,93,121,156,232,281,342,363],"factors":[25,94,157,282],"for":[26,48,65,75,148,369],"disease":[28,92,120,150,231,280,341,371],"such":[29,201],"as":[30,62,202],"diabetes":[31],"mellitus,":[32],"Coronary":[33],"Artery":[34],"Disease":[35],"(CAD),":[36],"hyperlipidemia,":[37],"hypertension,":[38],"smoking,":[39],"familial":[40],"CAD":[41],"history,":[42],"obesity,":[43],"medications":[45],"is":[46],"critical":[47],"developing":[49],"effective":[50],"preventative":[51],"management":[53],"measures.":[54],"Although":[55],"Electronic":[56],"Health":[57],"Records":[58],"(EHRs)":[59],"have":[60,218,307],"emerged":[61],"valuable":[63],"resources":[64],"identifying":[66],"these":[67],"factors,":[69],"their":[70],"unstructured":[71],"format":[72],"poses":[73],"challenges":[74],"cardiologists":[76],"in":[77,109,118,222,274,339,361],"retrieving":[78],"relevant":[79],"information.":[80],"This":[81,123,244,350],"research":[82],"proposed":[83,246],"employing":[84],"transfer":[85,98,356],"learning":[86,102,357],"techniques":[87],"to":[88,180,198,208],"automatically":[89],"extract":[90],"from":[95,141,158,226],"EHRs.":[96],"Leveraging":[97],"learning,":[99],"deep":[101,183],"technique":[103],"has":[104,289,330],"demonstrated":[105,219,352],"significant":[107],"performance":[108,221],"various":[110],"clinical":[111,159,178,242,264],"natural":[112],"language":[113,130,187],"processing":[114],"(NLP)":[115],"applications,":[116],"particularly":[117],"prediction.":[122],"study":[124,245,351],"explored":[125],"application":[127],"transformer-based":[129,251,328,359],"models,":[131,252],"specifically":[132],"utilizing":[133],"pre-trained":[134,169],"architectures":[135],"like":[136],"BERT":[137],"(Bidirectional":[138],"Encoder":[139],"Representations":[140],"Transformers),":[142],"RoBERTa,":[143,255],"BioClinicalBERT,":[144,256,302],"XLNet,":[145,257,303],"BioBERT":[147,305],"detection":[151],"extraction":[153],"related":[155],"notes,":[160],"using":[161,194,260,358],"i2b2":[163,204,263],"dataset.":[164,267],"These":[165,216],"transformer":[166],"models":[167,190,217,270,306,329,360],"are":[168,191],"an":[171],"extensive":[172],"corpus":[173],"medical":[175],"literature":[176],"records":[179],"gain":[181],"understanding":[184],"contextualized":[186],"representations.":[188],"Adapted":[189],"then":[192],"fine-tuned":[193,247,269],"annotated":[195],"datasets":[196],"specific":[197],"disease,":[200],"dataset,":[205],"enabling":[206],"them":[207],"learn":[209],"patterns":[210],"relationships":[212],"within":[213,240],"domain.":[215,243],"superior":[220],"extracting":[223],"semantic":[224],"information":[225],"EHRs,":[227],"automating":[228],"high-performance":[229],"factor":[233],"identification,":[234],"performing":[236],"downstream":[237],"NLP":[238,265],"tasks":[239],"five":[248,327],"widely":[249],"used":[250],"namely":[253],"BERT,":[254,301],"BioBERT,":[259],"2014":[262],"challenge":[266],"The":[268,286],"surpass":[271],"conventional":[272],"approaches":[273],"predicting":[275],"presence":[277],"with":[283,294,311],"impressive":[284],"accuracy.":[285],"RoBERTa":[287],"model":[288],"achieved":[290],"highest":[292],"performance,":[293],"micro":[295,312,346],"F1-scores":[296,313],"94.27%,":[298],"while":[299],"provided":[308],"competitive":[309],"performances":[310],"93.73%,":[315],"94.03%,":[316],"93.97%,":[317],"93.99%,":[319],"respectively.":[320],"Finally,":[321],"simple":[323],"ensemble":[324],"been":[331],"proposed,":[332],"which":[333],"outperformed":[334],"most":[336],"existing":[337],"methods":[338],"fan,":[343],"achieving":[344],"F1-Score":[347],"94.26%.":[349],"efficacy":[354],"enhancing":[362],"facilitating":[366],"early":[367],"intervention":[368],"prevention.":[372]},"counts_by_year":[{"year":2026,"cited_by_count":9},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":4}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
