{"id":"https://openalex.org/W3197086755","doi":"https://doi.org/10.3390/rs13183555","title":"Real-Time Underwater Maritime Object Detection in Side-Scan Sonar Images Based on Transformer-YOLOv5","display_name":"Real-Time Underwater Maritime Object Detection in Side-Scan Sonar Images Based on Transformer-YOLOv5","publication_year":2021,"publication_date":"2021-09-07","ids":{"openalex":"https://openalex.org/W3197086755","doi":"https://doi.org/10.3390/rs13183555","mag":"3197086755"},"language":"en","primary_location":{"id":"doi:10.3390/rs13183555","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs13183555","pdf_url":"https://www.mdpi.com/2072-4292/13/18/3555/pdf?version=1631434124","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2072-4292/13/18/3555/pdf?version=1631434124","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033822799","display_name":"Yongcan Yu","orcid":"https://orcid.org/0000-0002-8822-7781"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongcan Yu","raw_affiliation_strings":["Institute of Marine Science and Technology, Wuhan University, Wuhan 430079, China","School of Geodesy and Geomatics, Wuhan University, Wuhan 430079, China"],"affiliations":[{"raw_affiliation_string":"Institute of Marine Science and Technology, Wuhan University, Wuhan 430079, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"School of Geodesy and Geomatics, Wuhan University, Wuhan 430079, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018332007","display_name":"Jianhu Zhao","orcid":"https://orcid.org/0000-0003-3796-8405"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jianhu Zhao","raw_affiliation_strings":["Institute of Marine Science and Technology, Wuhan University, Wuhan 430079, China","School of Geodesy and Geomatics, Wuhan University, Wuhan 430079, China"],"affiliations":[{"raw_affiliation_string":"Institute of Marine Science and Technology, Wuhan University, Wuhan 430079, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"School of Geodesy and Geomatics, Wuhan University, Wuhan 430079, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074662062","display_name":"Quanhua Gong","orcid":null},"institutions":[{"id":"https://openalex.org/I4210130035","display_name":"China Communications Construction Company (China)","ror":"https://ror.org/03q3een69","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210130035"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Quanhua Gong","raw_affiliation_strings":["New Energy Engineering Limited Company of China Communications Construction Company Third Harbor Engineering Limited Company, Shanghai 200137, China"],"affiliations":[{"raw_affiliation_string":"New Energy Engineering Limited Company of China Communications Construction Company Third Harbor Engineering Limited Company, Shanghai 200137, China","institution_ids":["https://openalex.org/I4210130035"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080040279","display_name":"Chao Huang","orcid":"https://orcid.org/0000-0001-8611-7653"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Huang","raw_affiliation_strings":["Institute of Marine Science and Technology, Wuhan University, Wuhan 430079, China","School of Geodesy and Geomatics, Wuhan University, Wuhan 430079, China"],"affiliations":[{"raw_affiliation_string":"Institute of Marine Science and Technology, Wuhan University, Wuhan 430079, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"School of Geodesy and Geomatics, Wuhan University, Wuhan 430079, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103202484","display_name":"Gen Zheng","orcid":"https://orcid.org/0000-0003-2841-526X"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gen Zheng","raw_affiliation_strings":["Institute of Marine Science and Technology, Wuhan University, Wuhan 430079, China","School of Geodesy and Geomatics, Wuhan University, Wuhan 430079, China"],"affiliations":[{"raw_affiliation_string":"Institute of Marine Science and Technology, Wuhan University, Wuhan 430079, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"School of Geodesy and Geomatics, Wuhan University, Wuhan 430079, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076030187","display_name":"Jinye Ma","orcid":"https://orcid.org/0000-0003-4655-0019"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinye Ma","raw_affiliation_strings":["Institute of Marine Science and Technology, Wuhan University, Wuhan 430079, China","School of Geodesy and Geomatics, Wuhan University, Wuhan 430079, China"],"affiliations":[{"raw_affiliation_string":"Institute of Marine Science and Technology, Wuhan University, Wuhan 430079, China","institution_ids":["https://openalex.org/I37461747"]},{"raw_affiliation_string":"School of Geodesy and Geomatics, Wuhan University, Wuhan 430079, China","institution_ids":["https://openalex.org/I37461747"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5018332007"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":{"value":2500,"currency":"CHF","value_usd":2707},"apc_paid":{"value":2500,"currency":"CHF","value_usd":2707},"fwci":15.6318,"has_fulltext":false,"cited_by_count":229,"citation_normalized_percentile":{"value":0.99411793,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":100},"biblio":{"volume":"13","issue":"18","first_page":"3555","last_page":"3555"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11698","display_name":"Underwater Acoustics Research","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/1910","display_name":"Oceanography"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9746000170707703,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7957097291946411},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.7504686117172241},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7246946692466736},{"id":"https://openalex.org/keywords/underwater","display_name":"Underwater","score":0.6862913966178894},{"id":"https://openalex.org/keywords/side-scan-sonar","display_name":"Side-scan sonar","score":0.674704909324646},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6322934627532959},{"id":"https://openalex.org/keywords/sonar","display_name":"Sonar","score":0.5518867373466492},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5040318369865417},{"id":"https://openalex.org/keywords/automatic-target-recognition","display_name":"Automatic target recognition","score":0.45263776183128357},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41631433367729187},{"id":"https://openalex.org/keywords/synthetic-aperture-radar","display_name":"Synthetic aperture radar","score":0.14843130111694336},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.0959337055683136},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.07347691059112549}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7957097291946411},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.7504686117172241},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7246946692466736},{"id":"https://openalex.org/C98083399","wikidata":"https://www.wikidata.org/wiki/Q3246517","display_name":"Underwater","level":2,"score":0.6862913966178894},{"id":"https://openalex.org/C2776355146","wikidata":"https://www.wikidata.org/wiki/Q357527","display_name":"Side-scan sonar","level":3,"score":0.674704909324646},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6322934627532959},{"id":"https://openalex.org/C555745239","wikidata":"https://www.wikidata.org/wiki/Q133220","display_name":"Sonar","level":2,"score":0.5518867373466492},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5040318369865417},{"id":"https://openalex.org/C117623542","wikidata":"https://www.wikidata.org/wiki/Q621974","display_name":"Automatic target recognition","level":3,"score":0.45263776183128357},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41631433367729187},{"id":"https://openalex.org/C87360688","wikidata":"https://www.wikidata.org/wiki/Q740686","display_name":"Synthetic aperture radar","level":2,"score":0.14843130111694336},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0959337055683136},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.07347691059112549},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.3390/rs13183555","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs13183555","pdf_url":"https://www.mdpi.com/2072-4292/13/18/3555/pdf?version=1631434124","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:85d4fdeabcd748a9914d572c767bf7ff","is_oa":true,"landing_page_url":"https://doaj.org/article/85d4fdeabcd748a9914d572c767bf7ff","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Remote Sensing, Vol 13, Iss 18, p 3555 (2021)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2072-4292/13/18/3555/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/rs13183555","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Remote Sensing; Volume 13; Issue 18; Pages: 3555","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/rs13183555","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs13183555","pdf_url":"https://www.mdpi.com/2072-4292/13/18/3555/pdf?version=1631434124","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/14","score":0.8399999737739563,"display_name":"Life below water"}],"awards":[{"id":"https://openalex.org/G7061156634","display_name":null,"funder_award_id":"41376109","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8687962759","display_name":null,"funder_award_id":"41576107","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3197086755.pdf","grobid_xml":"https://content.openalex.org/works/W3197086755.grobid-xml"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W1836465849","https://openalex.org/W1968898624","https://openalex.org/W1975194708","https://openalex.org/W2118652164","https://openalex.org/W2342423581","https://openalex.org/W2565639579","https://openalex.org/W2736627027","https://openalex.org/W2740333758","https://openalex.org/W2791767745","https://openalex.org/W2908524565","https://openalex.org/W2912160656","https://openalex.org/W2943210864","https://openalex.org/W2944829497","https://openalex.org/W2962834855","https://openalex.org/W2963857746","https://openalex.org/W2969567505","https://openalex.org/W2993483871","https://openalex.org/W2996325784","https://openalex.org/W2997682172","https://openalex.org/W3009376633","https://openalex.org/W3025003426","https://openalex.org/W3042011474","https://openalex.org/W3044621282","https://openalex.org/W3094550093","https://openalex.org/W3106608482","https://openalex.org/W3109637960","https://openalex.org/W3130684229","https://openalex.org/W3132971810","https://openalex.org/W3163324518","https://openalex.org/W6739901393","https://openalex.org/W6762853333","https://openalex.org/W6786532315"],"related_works":["https://openalex.org/W1921505891","https://openalex.org/W2897910144","https://openalex.org/W2114161718","https://openalex.org/W1572693489","https://openalex.org/W2415693547","https://openalex.org/W2888512610","https://openalex.org/W2099932270","https://openalex.org/W2890449065","https://openalex.org/W855818946","https://openalex.org/W2547343994"],"abstract_inverted_index":{"To":[0],"overcome":[1],"the":[2,5,40,53,73,79,83,95,116,124],"shortcomings":[3],"of":[4,9,32,39,58,85,128],"traditional":[6],"manual":[7],"detection":[8],"underwater":[10,90],"targets":[11],"in":[12,26,78],"side-scan":[13],"sonar":[14],"(SSS)":[15],"images,":[16,60],"a":[17,61,66],"real-time":[18,125],"automatic":[19],"target":[20,49,91],"recognition":[21,126],"(ATR)":[22],"method":[23,30,80,97],"is":[24,76],"proposed":[25,96],"this":[27],"paper.":[28],"This":[29],"consists":[31],"image":[33],"preprocessing,":[34],"sampling,":[35],"ATR":[36],"by":[37],"integration":[38],"transformer":[41],"module":[42],"and":[43,48,55,65,72,87,104,108,111,122],"YOLOv5s":[44,117],"(that":[45],"is,":[46],"TR\u2013YOLOv5s),":[47],"localization.":[50],"By":[51],"considering":[52],"target-sparse":[54],"feature-barren":[56],"characteristics":[57],"SSS":[59],"novel":[62],"TR\u2013YOLOv5s":[63],"network":[64,118],"down-sampling":[67],"principle":[68],"are":[69],"put":[70],"forward,":[71],"attention":[74],"mechanism":[75],"introduced":[77],"to":[81],"meet":[82],"requirements":[84],"accuracy":[86],"efficiency":[88],"for":[89],"recognition.":[92],"Experiments":[93],"verified":[94],"achieved":[98],"85.6%":[99],"mean":[100],"average":[101],"precision":[102],"(mAP)":[103],"87.8%":[105],"macro-F2":[106],"score,":[107],"brought":[109],"12.5%":[110],"10.6%":[112],"gains":[113],"compared":[114],"with":[115],"trained":[119],"from":[120],"scratch,":[121],"had":[123],"speed":[127],"about":[129],"0.068":[130],"s":[131],"per":[132],"image.":[133]},"counts_by_year":[{"year":2026,"cited_by_count":13},{"year":2025,"cited_by_count":55},{"year":2024,"cited_by_count":60},{"year":2023,"cited_by_count":62},{"year":2022,"cited_by_count":36},{"year":2021,"cited_by_count":3}],"updated_date":"2026-04-06T07:47:59.780226","created_date":"2021-09-13T00:00:00"}
