{"id":"https://openalex.org/W4321094182","doi":"https://doi.org/10.3390/rs15041076","title":"HTDet: A Hybrid Transformer-Based Approach for Underwater Small Object Detection","display_name":"HTDet: A Hybrid Transformer-Based Approach for Underwater Small Object Detection","publication_year":2023,"publication_date":"2023-02-16","ids":{"openalex":"https://openalex.org/W4321094182","doi":"https://doi.org/10.3390/rs15041076"},"language":"en","primary_location":{"id":"doi:10.3390/rs15041076","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs15041076","pdf_url":"https://www.mdpi.com/2072-4292/15/4/1076/pdf?version=1676529817","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2072-4292/15/4/1076/pdf?version=1676529817","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035568063","display_name":"Gangqi Chen","orcid":"https://orcid.org/0000-0001-8118-4515"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gangqi Chen","raw_affiliation_strings":["School of Marine Science and Technology, Northwestern Polytechnical University, Xi\u2019an 710072, China","School of Marine Science and Technology, Northwestern Polytechnical University, Xi'an 710072, China"],"affiliations":[{"raw_affiliation_string":"School of Marine Science and Technology, Northwestern Polytechnical University, Xi\u2019an 710072, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"School of Marine Science and Technology, Northwestern Polytechnical University, Xi'an 710072, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068625837","display_name":"Zhaoyong Mao","orcid":"https://orcid.org/0000-0001-5746-6133"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhaoyong Mao","raw_affiliation_strings":["Unmanned System Research Institute, Northwestern Polytechnical University, Xi\u2019an 710072, China","Unmanned System Research Institute, Northwestern Polytechnical University, Xi'an 710072, China"],"affiliations":[{"raw_affiliation_string":"Unmanned System Research Institute, Northwestern Polytechnical University, Xi\u2019an 710072, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"Unmanned System Research Institute, Northwestern Polytechnical University, Xi'an 710072, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100766804","display_name":"Kai Wang","orcid":"https://orcid.org/0000-0001-5589-7060"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kai Wang","raw_affiliation_strings":["Henan Key Laboratory of Underwater Intelligent Equipment, Zhengzhou 710072, China"],"affiliations":[{"raw_affiliation_string":"Henan Key Laboratory of Underwater Intelligent Equipment, Zhengzhou 710072, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5081646661","display_name":"Junge Shen","orcid":"https://orcid.org/0000-0002-6563-9206"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Junge Shen","raw_affiliation_strings":["Unmanned System Research Institute, Northwestern Polytechnical University, Xi\u2019an 710072, China","Unmanned System Research Institute, Northwestern Polytechnical University, Xi'an 710072, China"],"affiliations":[{"raw_affiliation_string":"Unmanned System Research Institute, Northwestern Polytechnical University, Xi\u2019an 710072, China","institution_ids":["https://openalex.org/I17145004"]},{"raw_affiliation_string":"Unmanned System Research Institute, Northwestern Polytechnical University, Xi'an 710072, China","institution_ids":["https://openalex.org/I17145004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5081646661"],"corresponding_institution_ids":["https://openalex.org/I17145004"],"apc_list":{"value":2500,"currency":"CHF","value_usd":2707},"apc_paid":{"value":2500,"currency":"CHF","value_usd":2707},"fwci":5.4553,"has_fulltext":true,"cited_by_count":46,"citation_normalized_percentile":{"value":0.96993541,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"15","issue":"4","first_page":"1076","last_page":"1076"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.9872999787330627,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7747551202774048},{"id":"https://openalex.org/keywords/underwater","display_name":"Underwater","score":0.7299172282218933},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5966693162918091},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.537283718585968},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5165459513664246},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4948062300682068},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.45505577325820923},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.4378122389316559},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4226638078689575},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.3947374224662781},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.346940279006958},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.22065013647079468},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.12603607773780823},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.12075173854827881},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.08928772807121277},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07724040746688843}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7747551202774048},{"id":"https://openalex.org/C98083399","wikidata":"https://www.wikidata.org/wiki/Q3246517","display_name":"Underwater","level":2,"score":0.7299172282218933},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5966693162918091},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.537283718585968},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5165459513664246},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4948062300682068},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.45505577325820923},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.4378122389316559},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4226638078689575},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3947374224662781},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.346940279006958},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.22065013647079468},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.12603607773780823},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.12075173854827881},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.08928772807121277},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07724040746688843},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/rs15041076","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs15041076","pdf_url":"https://www.mdpi.com/2072-4292/15/4/1076/pdf?version=1676529817","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:6178615cc5744b8e9699c50e64ec4114","is_oa":true,"landing_page_url":"https://doaj.org/article/6178615cc5744b8e9699c50e64ec4114","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Remote Sensing, Vol 15, Iss 4, p 1076 (2023)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2072-4292/15/4/1076/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/rs15041076","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Remote Sensing","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/rs15041076","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs15041076","pdf_url":"https://www.mdpi.com/2072-4292/15/4/1076/pdf?version=1676529817","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Life below water","score":0.8299999833106995,"id":"https://metadata.un.org/sdg/14"}],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4640338107","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320309475","funder_display_name":"Northwestern University"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8621529372","display_name":null,"funder_award_id":"61603233","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320309475","display_name":"Northwestern University","ror":"https://ror.org/000e0be47"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321392","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4321094182.pdf"},"referenced_works_count":56,"referenced_works":["https://openalex.org/W1483870316","https://openalex.org/W1861492603","https://openalex.org/W2193145675","https://openalex.org/W2531409750","https://openalex.org/W2565639579","https://openalex.org/W2613718673","https://openalex.org/W2751481876","https://openalex.org/W2769400802","https://openalex.org/W2790284570","https://openalex.org/W2925359305","https://openalex.org/W2953303055","https://openalex.org/W2954996726","https://openalex.org/W2962721361","https://openalex.org/W2963163009","https://openalex.org/W2963351448","https://openalex.org/W2964093967","https://openalex.org/W2966501856","https://openalex.org/W2989676862","https://openalex.org/W2991100582","https://openalex.org/W2993483871","https://openalex.org/W2995139153","https://openalex.org/W3013211776","https://openalex.org/W3015543858","https://openalex.org/W3035396860","https://openalex.org/W3063016731","https://openalex.org/W3094046575","https://openalex.org/W3096609285","https://openalex.org/W3096998908","https://openalex.org/W3097028850","https://openalex.org/W3103294617","https://openalex.org/W3106250896","https://openalex.org/W3107867277","https://openalex.org/W3122799380","https://openalex.org/W3158715390","https://openalex.org/W3159459366","https://openalex.org/W3172752666","https://openalex.org/W3172759799","https://openalex.org/W3179888767","https://openalex.org/W3185014437","https://openalex.org/W3193027989","https://openalex.org/W3209499093","https://openalex.org/W3214181264","https://openalex.org/W3217445779","https://openalex.org/W4200300735","https://openalex.org/W4200495849","https://openalex.org/W4206294875","https://openalex.org/W4206545193","https://openalex.org/W4210958248","https://openalex.org/W4220691786","https://openalex.org/W4221132539","https://openalex.org/W4228998801","https://openalex.org/W4285107695","https://openalex.org/W4293215762","https://openalex.org/W4313030791","https://openalex.org/W4313506322","https://openalex.org/W6784434877"],"related_works":["https://openalex.org/W4388412763","https://openalex.org/W3125011624","https://openalex.org/W1508631387","https://openalex.org/W2591930867","https://openalex.org/W2370917603","https://openalex.org/W4206178588","https://openalex.org/W4287635093","https://openalex.org/W3094491777","https://openalex.org/W3214715529","https://openalex.org/W4315498985"],"abstract_inverted_index":{"As":[0],"marine":[1,33],"observation":[2],"technology":[3],"develops":[4],"rapidly,":[5],"underwater":[6,74],"optical":[7,40],"image":[8],"object":[9,75],"detection":[10,76],"is":[11,58,83,91,105,119,137],"beginning":[12],"to":[13,49,64,107,139,162],"occupy":[14],"an":[15,39,146],"important":[16],"role":[17],"in":[18,30,145],"many":[19],"tasks,":[20,26],"such":[21,56],"as":[22],"naval":[23],"coastal":[24],"defense":[25],"aquaculture,":[27],"etc.":[28],"However,":[29],"the":[31,35,109,116,132,156,164,169,179,186],"complex":[32],"environment,":[34],"images":[36],"captured":[37],"by":[38,171,182,191],"imaging":[41],"system":[42],"are":[43,189],"usually":[44],"severely":[45],"degraded.":[46],"Therefore,":[47],"how":[48],"detect":[50,140],"objects":[51,144],"accurately":[52],"and":[53,142,148,168,185],"quickly":[54],"under":[55],"conditions":[57],"a":[59,70,79,86,100,172],"critical":[60],"problem":[61],"that":[62,93,131],"needs":[63],"be":[65],"solved.":[66],"In":[67],"this":[68],"manuscript,":[69],"novel":[71],"framework":[72],"for":[73,121],"based":[77],"on":[78],"hybrid":[80,88],"transformer":[81],"network":[82,90,104],"proposed.":[84],"First,":[85],"lightweight":[87],"transformer-based":[89],"presented":[92],"can":[94],"extract":[95],"global":[96],"contextual":[97],"information.":[98],"Second,":[99],"fine-grained":[101],"feature":[102],"pyramid":[103],"used":[106],"overcome":[108],"issues":[110],"of":[111,166],"feeble":[112,141],"signal":[113],"disappearance.":[114],"Third,":[115],"test-time-augmentation":[117],"method":[118],"applied":[120],"inference":[122],"without":[123],"introducing":[124],"additional":[125],"parameters.":[126],"Extensive":[127],"experiments":[128],"have":[129,135],"shown":[130],"approach":[133],"we":[134],"proposed":[136],"able":[138],"small":[143],"efficient":[147],"effective":[149],"way.":[150],"Furthermore,":[151],"our":[152,176],"model":[153,181,187],"significantly":[154],"outperforms":[155,178],"latest":[157],"advanced":[158],"detectors":[159],"with":[160],"respect":[161],"both":[163],"number":[165],"parameters":[167,188],"mAP":[170],"considerable":[173],"margin.":[174],"Specifically,":[175],"detector":[177],"baseline":[180],"6.3":[183],"points,":[184],"reduced":[190],"28.5":[192],"M.":[193]},"counts_by_year":[{"year":2026,"cited_by_count":7},{"year":2025,"cited_by_count":18},{"year":2024,"cited_by_count":19},{"year":2023,"cited_by_count":2}],"updated_date":"2026-04-19T08:26:33.389920","created_date":"2025-10-10T00:00:00"}
