{"id":"https://openalex.org/W7161817067","doi":"https://doi.org/10.1109/isbi61048.2026.11515926","title":"Medical Small Object Detection Algorithm Based on Multi-Scale Frequency Domain Enhancement and Cross-Attention Fusion","display_name":"Medical Small Object Detection Algorithm Based on Multi-Scale Frequency Domain Enhancement and Cross-Attention Fusion","publication_year":2026,"publication_date":"2026-04-08","ids":{"openalex":"https://openalex.org/W7161817067","doi":"https://doi.org/10.1109/isbi61048.2026.11515926"},"language":null,"primary_location":{"id":"doi:10.1109/isbi61048.2026.11515926","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isbi61048.2026.11515926","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE 23rd International Symposium on Biomedical Imaging (ISBI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136597156","display_name":"Qi Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qi Wang","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Sciences,State Key Laboratory for Multimodal Artificial Intelligence Systems,Beijing,China,100190"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences,State Key Laboratory for Multimodal Artificial Intelligence Systems,Beijing,China,100190","institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5136524313","display_name":"Ge Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ge Yang","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Sciences,State Key Laboratory for Multimodal Artificial Intelligence Systems,Beijing,China,100190"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences,State Key Laboratory for Multimodal Artificial Intelligence Systems,Beijing,China,100190","institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5136597156"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210094879"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.94006595,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13567","display_name":"AI and Multimedia in Education","score":0.13650000095367432,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13567","display_name":"AI and Multimedia in Education","score":0.13650000095367432,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.12759999930858612,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.0406000018119812,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.546999990940094},{"id":"https://openalex.org/keywords/frequency-domain","display_name":"Frequency domain","score":0.5281999707221985},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.4943000078201294},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4440999925136566},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4311999976634979},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.39750000834465027}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5921000242233276},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5848000049591064},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.546999990940094},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5335000157356262},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5297999978065491},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.5281999707221985},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.4943000078201294},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4440999925136566},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4311999976634979},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.39750000834465027},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.35740000009536743},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.3336000144481659},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.3172000050544739},{"id":"https://openalex.org/C193536780","wikidata":"https://www.wikidata.org/wiki/Q1513153","display_name":"Edge detection","level":4,"score":0.2624000012874603},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/isbi61048.2026.11515926","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isbi61048.2026.11515926","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE 23rd International Symposium on Biomedical Imaging (ISBI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2840938334","display_name":null,"funder_award_id":"2024YFF0729202","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G7359957411","display_name":null,"funder_award_id":"92354307","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7363891303","display_name":null,"funder_award_id":"E3E45201X2","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W4313023779","https://openalex.org/W4377981744","https://openalex.org/W4385801610","https://openalex.org/W4386352593","https://openalex.org/W4387969595","https://openalex.org/W4388517067","https://openalex.org/W4393372396","https://openalex.org/W4401751460","https://openalex.org/W4402754006","https://openalex.org/W4402915568","https://openalex.org/W4405286907","https://openalex.org/W4408353081"],"related_works":[],"abstract_inverted_index":{"Medical":[0],"Small":[1],"Object":[2],"Detection":[3],"(MSOD)":[4],"can":[5],"assist":[6],"in":[7,22,25,33,94,133],"lesion":[8],"localization,":[9],"cell":[10],"identification,":[11],"and":[12,36,48,64,92,102,109,135],"drug":[13],"development.":[14],"While":[15],"deep":[16,68],"learning-based":[17],"methods":[18],"have":[19],"made":[20],"progress":[21],"this":[23],"field":[24],"recent":[26],"years,":[27],"they":[28],"still":[29],"face":[30],"significant":[31],"limitations":[32],"detection":[34],"accuracy":[35],"speed.":[37],"To":[38,53,86],"address":[39,54,87],"these":[40],"challenges,":[41],"we":[42,72,98],"propose":[43,73,99],"Multi-scale":[44,74],"frequency":[45],"domain":[46,76],"enhancement":[47],"Cross":[49,104],"attention":[50],"fusion":[51],"(MC-MSOD).":[52],"the":[55,82,88,119],"lack":[56],"of":[57,60,67,126],"spatial":[58],"sensitivity":[59],"small":[61,96],"target":[62],"features":[63,91],"insufficient":[65],"extraction":[66],"semantic":[69],"feature":[70],"information,":[71],"Frequency":[75],"Feature":[77],"Enhancement":[78],"(MFFE)":[79],"based":[80],"on":[81,118],"fast":[83],"fourier":[84],"transform.":[85],"sparse":[89],"positional":[90],"difficulty":[93],"modeling":[95],"targets,":[97],"Position":[100],"embedding":[101],"Channel":[103],"Attention":[105],"(PCCA).":[106],"Through":[107],"comprehensive":[108],"scientific":[110],"experimental":[111],"analysis,":[112],"compared":[113],"to":[114],"current":[115],"state-of-the-art":[116],"algorithms":[117],"public":[120],"BCCD":[121],"dataset,":[122],"MC-MSOD":[123],"demonstrates":[124],"improvements":[125],"<tex":[127],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[128],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$0.22":[129],"\\%,":[130],"1.47":[131],"\\%$</tex>":[132],"mAP@50":[134],"mAP@50-95,":[136],"respectively.":[137]},"counts_by_year":[],"updated_date":"2026-05-22T06:13:13.366637","created_date":"2026-05-21T00:00:00"}
