{"id":"https://openalex.org/W7151502828","doi":"https://doi.org/10.1109/icmla66185.2025.00077","title":"Medical Imaging with Deep Learning: A Comparison of CNN and Transformer Models","display_name":"Medical Imaging with Deep Learning: A Comparison of CNN and Transformer Models","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W7151502828","doi":"https://doi.org/10.1109/icmla66185.2025.00077"},"language":null,"primary_location":{"id":"doi:10.1109/icmla66185.2025.00077","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla66185.2025.00077","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Machine Learning and Applications (ICMLA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109235962","display_name":"Kehan Gao","orcid":null},"institutions":[{"id":"https://openalex.org/I203331390","display_name":"Eastern Connecticut State University","ror":"https://ror.org/01mhgwt57","country_code":"US","type":"education","lineage":["https://openalex.org/I203331390","https://openalex.org/I4210132746"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Kehan Gao","raw_affiliation_strings":["Eastern Connecticut State University,Computer Science,Willimantic,CT,USA"],"affiliations":[{"raw_affiliation_string":"Eastern Connecticut State University,Computer Science,Willimantic,CT,USA","institution_ids":["https://openalex.org/I203331390"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113646357","display_name":"Sarah Tasneem","orcid":null},"institutions":[{"id":"https://openalex.org/I203331390","display_name":"Eastern Connecticut State University","ror":"https://ror.org/01mhgwt57","country_code":"US","type":"education","lineage":["https://openalex.org/I203331390","https://openalex.org/I4210132746"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sarah Tasneem","raw_affiliation_strings":["Eastern Connecticut State University,Computer Science,Willimantic,CT,USA"],"affiliations":[{"raw_affiliation_string":"Eastern Connecticut State University,Computer Science,Willimantic,CT,USA","institution_ids":["https://openalex.org/I203331390"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089170562","display_name":"Taghi M. Khoshgoftaar","orcid":null},"institutions":[{"id":"https://openalex.org/I63772739","display_name":"Florida Atlantic University","ror":"https://ror.org/05p8w6387","country_code":"US","type":"education","lineage":["https://openalex.org/I63772739"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Taghi M. Khoshgoftaar","raw_affiliation_strings":["Florida Atlantic University,Electrical Engineering and Computer Science,Boca Raton,FL,USA"],"affiliations":[{"raw_affiliation_string":"Florida Atlantic University,Electrical Engineering and Computer Science,Boca Raton,FL,USA","institution_ids":["https://openalex.org/I63772739"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5109235962"],"corresponding_institution_ids":["https://openalex.org/I203331390"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.74923122,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"523","last_page":"530"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.21660000085830688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.21660000085830688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.05909999832510948,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.054999999701976776,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.6100000143051147},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.38909998536109924},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3418000042438507},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.25519999861717224},{"id":"https://openalex.org/keywords/medical-diagnosis","display_name":"Medical diagnosis","score":0.2524000108242035}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6244000196456909},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.6100000143051147},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5764999985694885},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5562000274658203},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.38909998536109924},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3418000042438507},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.25519999861717224},{"id":"https://openalex.org/C534262118","wikidata":"https://www.wikidata.org/wiki/Q177719","display_name":"Medical diagnosis","level":2,"score":0.2524000108242035},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2515999972820282},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.24580000340938568}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icmla66185.2025.00077","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icmla66185.2025.00077","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Machine Learning and Applications (ICMLA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W2183341477","https://openalex.org/W2533800772","https://openalex.org/W2788633781","https://openalex.org/W3131500599","https://openalex.org/W4312349930","https://openalex.org/W4319300365","https://openalex.org/W4321232185","https://openalex.org/W4378528007","https://openalex.org/W4411024755"],"related_works":[],"abstract_inverted_index":{"This":[0,106],"study":[1],"presents":[2],"a":[3,125,129],"comprehensive":[4],"evaluation":[5],"of":[6,30,138,156],"deep":[7],"learning":[8],"approaches":[9],"for":[10,102,109,159],"medical":[11,54,72,148],"image":[12],"classification":[13,66],"tasks,":[14],"focusing":[15],"on":[16],"both":[17,60,91],"convolutional":[18],"neural":[19],"networks":[20],"(CNNs)":[21],"and":[22,36,38,46,63,93],"transformer-based":[23,40,80,157],"models.":[24],"Specifically,":[25],"we":[26],"assess":[27],"the":[28,95,139,154],"performance":[29,90,133],"three":[31,39,51],"CNN":[32,126],"architectures":[33],"(InceptionNet,":[34],"DenseNet,":[35],"EfficientNet)":[37],"models":[41,81,142,158],"(Vision":[42],"Transformer,":[43,45],"Swin":[44],"Pyramid":[47],"Vision":[48],"Transformer)":[49],"using":[50],"publicly":[52],"available":[53],"imaging":[55,149],"datasets.":[56],"These":[57,151],"datasets":[58],"represent":[59],"balanced":[61],"multi-class":[62],"imbalanced":[64],"binary":[65],"scenarios,":[67],"reflecting":[68],"real-world":[69],"challenges":[70],"in":[71,100,118,121,145],"diagnostics.":[73],"The":[74],"experimental":[75],"results":[76],"consistently":[77],"show":[78],"that":[79,137],"outperform":[82],"conventional":[83],"CNNs":[84],"across":[85],"all":[86],"datasets,":[87],"demonstrating":[88],"superior":[89],"overall":[92],"at":[94],"individual":[96],"class":[97],"level,":[98],"particularly":[99],"recall":[101,164],"clinically":[103],"critical":[104],"classes.":[105],"is":[107,165],"crucial":[108],"minimizing":[110],"severe":[111],"Type":[112],"II":[113],"errors,":[114],"which":[115],"can":[116],"result":[117],"missed":[119],"diagnoses":[120],"practice.":[122],"While":[123],"EfficientNet,":[124],"architecture,":[127],"remains":[128],"strong":[130],"baseline":[131],"with":[132],"often":[134],"comparable":[135],"to":[136],"transformers,":[140],"attention-based":[141],"demonstrate":[143],"effectiveness":[144],"handling":[146],"complex":[147],"tasks.":[150],"findings":[152],"underscore":[153],"potential":[155],"clinical":[160],"deployment":[161],"when":[162],"high":[163],"essential.":[166]},"counts_by_year":[],"updated_date":"2026-04-09T06:08:40.794217","created_date":"2026-04-08T00:00:00"}
