{"id":"https://openalex.org/W7147393145","doi":"https://doi.org/10.1109/icvisp68610.2025.11451686","title":"IRSO-YOLO: An Improved Infrared Small Object Detection Algorithm Based on YOLOv8","display_name":"IRSO-YOLO: An Improved Infrared Small Object Detection Algorithm Based on YOLOv8","publication_year":2025,"publication_date":"2025-11-28","ids":{"openalex":"https://openalex.org/W7147393145","doi":"https://doi.org/10.1109/icvisp68610.2025.11451686"},"language":null,"primary_location":{"id":"doi:10.1109/icvisp68610.2025.11451686","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icvisp68610.2025.11451686","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 9th International Conference on Vision, Image and Signal Processing (ICVISP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132702955","display_name":"Zhongpin Niu","orcid":null},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhongpin Niu","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University,College of Artificial Intelligence,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University,College of Artificial Intelligence,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100623510","display_name":"Ping Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Yu","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University,College of Artificial Intelligence,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University,College of Artificial Intelligence,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065267589","display_name":"Long He","orcid":"https://orcid.org/0000-0002-4442-728X"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Longfei He","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University,College of Artificial Intelligence,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University,College of Artificial Intelligence,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044561987","display_name":"Xuchong Zhang","orcid":"https://orcid.org/0000-0003-2772-2700"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuchong Zhang","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University,College of Artificial Intelligence,Xi&#x2019;an,China"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University,College of Artificial Intelligence,Xi&#x2019;an,China","institution_ids":["https://openalex.org/I87445476"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5132702955"],"corresponding_institution_ids":["https://openalex.org/I87445476"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.75346672,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.5375999808311462,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.5375999808311462,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.18019999563694,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11856","display_name":"Thermography and Photoacoustic Techniques","score":0.037700001150369644,"subfield":{"id":"https://openalex.org/subfields/2211","display_name":"Mechanics of Materials"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.728600025177002},{"id":"https://openalex.org/keywords/infrared","display_name":"Infrared","score":0.6955000162124634},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6790000200271606},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5838000178337097},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5349000096321106},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.47290000319480896},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4496999979019165},{"id":"https://openalex.org/keywords/saliency-map","display_name":"Saliency map","score":0.34470000863075256}],"concepts":[{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.728600025177002},{"id":"https://openalex.org/C158355884","wikidata":"https://www.wikidata.org/wiki/Q11388","display_name":"Infrared","level":2,"score":0.6955000162124634},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6790000200271606},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6510000228881836},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6489999890327454},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5838000178337097},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5349000096321106},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5175999999046326},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.47290000319480896},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4643000066280365},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4496999979019165},{"id":"https://openalex.org/C2779679900","wikidata":"https://www.wikidata.org/wiki/Q25304431","display_name":"Saliency map","level":3,"score":0.34470000863075256},{"id":"https://openalex.org/C169903167","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Test set","level":2,"score":0.3176000118255615},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3172999918460846},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2865000069141388},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.28540000319480896},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C106516650","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm design","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.2703999876976013},{"id":"https://openalex.org/C126422989","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature detection (computer vision)","level":4,"score":0.26249998807907104}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icvisp68610.2025.11451686","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icvisp68610.2025.11451686","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 9th International Conference on Vision, Image and Signal Processing (ICVISP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2102605133","https://openalex.org/W2752782242","https://openalex.org/W2963163009","https://openalex.org/W3110751712","https://openalex.org/W3207919963","https://openalex.org/W3217173240","https://openalex.org/W4225315053","https://openalex.org/W4318695031","https://openalex.org/W4323317962","https://openalex.org/W4366598917","https://openalex.org/W4386076325","https://openalex.org/W4390638237","https://openalex.org/W4394858325","https://openalex.org/W4408467392"],"related_works":[],"abstract_inverted_index":{"Infrared":[0],"images":[1],"are":[2],"characterized":[3],"by":[4,114],"low":[5,8],"contrast":[6],"and":[7,62,94,98,105,140],"signal-to-noise":[9],"ratios,":[10],"particularly":[11],"for":[12,48,103],"small":[13,27,50],"objects,":[14,107],"which":[15,53,135],"lack":[16],"distinct":[17],"features":[18],"in":[19,89,101,143],"infrared":[20,26,49],"images,":[21],"making":[22],"the":[23,59,71,78,82,92,111,118],"detection":[24,55,123,130],"of":[25,81,96,132],"object":[28,51],"a":[29,86],"significant":[30],"challenge.":[31],"To":[32],"alleviate":[33],"these":[34],"issues,":[35],"based":[36],"on":[37,77,125],"YOLOv8":[38],"algorithm,":[39],"this":[40],"paper":[41],"proposes":[42],"an":[43,64],"improved":[44,119],"algorithm":[45,120],"named":[46],"IRSO-YOLO":[47,72],"detection,":[52],"enhanced":[54],"performance":[56,124],"through":[57],"optimizing":[58],"feature":[60],"scales":[61],"integrating":[63],"SEAttention":[65],"module.":[66],"Experimental":[67],"results":[68],"demonstrate":[69],"that":[70],"outperforms":[73],"other":[74],"classic":[75],"algorithms":[76],"test":[79],"set":[80],"HIT-UAV":[83],"dataset,":[84],"with":[85],"3.2%":[87],"increase":[88],"mAP50":[90],"over":[91],"baseline,":[93],"increases":[95],"2.3%":[97],"$13.5":[99],"\\%$":[100],"AP50":[102],"Tiny":[104],"Small":[106],"respectively,":[108],"while":[109],"reducing":[110],"model\u2019s":[112],"Params":[113],"$69.4":[115],"\\%$.":[116],"Additionally,":[117],"demonstrates":[121],"excellent":[122],"embedded":[126],"platform,":[127],"achieving":[128],"real-time":[129],"effect":[131],"31.4":[133],"FPS,":[134],"proves":[136],"its":[137],"application":[138],"potential":[139],"high":[141],"efficiency":[142],"real":[144],"environment.":[145]},"counts_by_year":[],"updated_date":"2026-04-02T13:53:19.096889","created_date":"2026-04-02T00:00:00"}
