{"id":"https://openalex.org/W7151884698","doi":"https://doi.org/10.48550/arxiv.2604.05363","title":"Rethinking IRSTD: Single-Point Supervision Guided Encoder-only Framework is Enough for Infrared Small Target Detection","display_name":"Rethinking IRSTD: Single-Point Supervision Guided Encoder-only Framework is Enough for Infrared Small Target Detection","publication_year":2026,"publication_date":"2026-04-07","ids":{"openalex":"https://openalex.org/W7151884698","doi":"https://doi.org/10.48550/arxiv.2604.05363"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.05363","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05363","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.05363","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133155660","display_name":"Rixiang Ni","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ni, Rixiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133206481","display_name":"Boyang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Boyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133212830","display_name":"Jun Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Jun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084265344","display_name":"Yonghao Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yonghao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133201964","display_name":"Feiyu Ren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ren, Feiyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126685924","display_name":"Yuji Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yuji","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133183549","display_name":"Haoyang Yuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuan, Haoyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133195584","display_name":"Wujiao He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Wujiao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133151175","display_name":"Wei An","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"An, Wei","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5133155660"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.8948000073432922,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.8948000073432922,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.02630000002682209,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11637","display_name":"Advanced Semiconductor Detectors and Materials","score":0.010099999606609344,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.7347000241279602},{"id":"https://openalex.org/keywords/clutter","display_name":"Clutter","score":0.7181000113487244},{"id":"https://openalex.org/keywords/false-alarm","display_name":"False alarm","score":0.5127999782562256},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.4927999973297119},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.4830000102519989},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.4805999994277954},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4620000123977661},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.45179998874664307},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4480000138282776},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4440000057220459}],"concepts":[{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.7347000241279602},{"id":"https://openalex.org/C132094186","wikidata":"https://www.wikidata.org/wiki/Q641585","display_name":"Clutter","level":3,"score":0.7181000113487244},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6800000071525574},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6626999974250793},{"id":"https://openalex.org/C2776836416","wikidata":"https://www.wikidata.org/wiki/Q1364844","display_name":"False alarm","level":2,"score":0.5127999782562256},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.4927999973297119},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.4830000102519989},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.4805999994277954},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4620000123977661},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4607999920845032},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.45179998874664307},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4480000138282776},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4440000057220459},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4156999886035919},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.4092999994754791},{"id":"https://openalex.org/C77052588","wikidata":"https://www.wikidata.org/wiki/Q644307","display_name":"Constant false alarm rate","level":2,"score":0.4047999978065491},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.40209999680519104},{"id":"https://openalex.org/C2778949103","wikidata":"https://www.wikidata.org/wiki/Q600717","display_name":"Staring","level":2,"score":0.39649999141693115},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.38350000977516174},{"id":"https://openalex.org/C2779726219","wikidata":"https://www.wikidata.org/wiki/Q7685884","display_name":"Target acquisition","level":2,"score":0.3630000054836273},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.35420000553131104},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.3206999897956848},{"id":"https://openalex.org/C146599234","wikidata":"https://www.wikidata.org/wiki/Q511093","display_name":"Centroid","level":2,"score":0.3118000030517578},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.3012999892234802},{"id":"https://openalex.org/C117623542","wikidata":"https://www.wikidata.org/wiki/Q621974","display_name":"Automatic target recognition","level":3,"score":0.28610000014305115},{"id":"https://openalex.org/C2778857364","wikidata":"https://www.wikidata.org/wiki/Q974850","display_name":"Missile","level":2,"score":0.2842999994754791},{"id":"https://openalex.org/C158355884","wikidata":"https://www.wikidata.org/wiki/Q11388","display_name":"Infrared","level":2,"score":0.2831999957561493},{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.2768999934196472},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.27399998903274536},{"id":"https://openalex.org/C2778775528","wikidata":"https://www.wikidata.org/wiki/Q5135432","display_name":"Closing (real estate)","level":2,"score":0.27149999141693115},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2639999985694885},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.2565000057220459}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.05363","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05363","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.05363","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05363","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Infrared":[0,97],"small":[1,8,34],"target":[2,66,72,171],"detection":[3,190],"(IRSTD)":[4],"aims":[5],"to":[6,17,109],"separate":[7],"targets":[9,35],"from":[10],"clutter":[11,50],"backgrounds.":[12,51],"Extensive":[13],"research":[14],"is":[15,105,205],"dedicated":[16],"the":[18,31,59,110],"pixel-level":[19],"supervision-guided":[20],"\"encoder-decoder\"":[21],"segmentation":[22],"paradigm.":[23],"Although":[24],"having":[25],"achieved":[26],"promising":[27],"performance,":[28],"they":[29],"neglect":[30],"fact":[32],"that":[33,58,148,185],"only":[36],"occupy":[37],"a":[38,86,92,123,143],"few":[39],"pixels":[40],"and":[41,90,116,160,182,199],"are":[42],"usually":[43],"accompanied":[44,74],"with":[45,75,137,142,192],"blurred":[46],"boundary":[47],"caused":[48],"by":[49],"Based":[52],"on":[53,176],"this":[54,80],"observation,":[55],"we":[56,82,120],"argue":[57],"first":[60,121],"principle":[61],"of":[62,69],"IRSTD":[63,84,178],"should":[64],"be":[65],"localization":[67],"instead":[68],"separating":[70],"all":[71],"region":[73],"indistinguishable":[76],"background":[77],"noise.":[78],"In":[79],"paper,":[81],"reformulate":[83],"as":[85],"centroid":[87],"regression":[88,152],"task":[89],"propose":[91],"novel":[93],"Single-Point":[94],"Supervision":[95,126],"guided":[96],"Probabilistic":[98,145],"Response":[99],"Encoding":[100],"method":[101],"(namely,":[102],"SPIRE),":[103],"which":[104,128],"indeed":[106],"challenging":[107],"due":[108],"mismatch":[111],"between":[112],"reduced":[113,201],"supervision":[114,163],"network":[115],"equivalent":[117],"output.":[118],"Specifically,":[119],"design":[122],"Point-Response":[124],"Prior":[125],"(PRPS),":[127],"transforms":[129],"single-point":[130],"annotations":[131],"into":[132],"probabilistic":[133],"response":[134,140],"map":[135],"consistent":[136],"infrared":[138],"point-target":[139],"characteristics,":[141],"High-Resolution":[144],"Encoder":[146],"(HRPE)":[147],"enables":[149],"encoder-only,":[150],"end-to-end":[151],"without":[153],"decoder":[154],"reconstruction.":[155],"By":[156],"preserving":[157],"high-resolution":[158],"features":[159],"increasing":[161],"effective":[162],"density,":[164],"SPIRE":[165,186],"alleviates":[166],"optimization":[167],"instability":[168],"under":[169],"sparse":[170],"distributions.":[172],"Finally,":[173],"extensive":[174],"experiments":[175],"various":[177],"benchmarks,":[179],"including":[180],"SIRST-UAVB":[181],"SIRST4":[183],"demonstrate":[184],"achieves":[187],"competitive":[188],"target-level":[189],"performance":[191],"consistently":[193],"low":[194],"false":[195],"alarm":[196],"rate":[197],"(Fa)":[198],"significantly":[200],"computational":[202],"cost.":[203],"Code":[204],"publicly":[206],"available":[207],"at:":[208],"https://github.com/NIRIXIANG/SPIRE-IRSTD.":[209]},"counts_by_year":[],"updated_date":"2026-04-09T06:13:59.934233","created_date":"2026-04-09T00:00:00"}
