{"id":"https://openalex.org/W4406860686","doi":"https://doi.org/10.1109/apsipaasc63619.2025.10849095","title":"AFSDet: Video Small Object Detection Based on Adaptive Focused Slicing","display_name":"AFSDet: Video Small Object Detection Based on Adaptive Focused Slicing","publication_year":2024,"publication_date":"2024-12-03","ids":{"openalex":"https://openalex.org/W4406860686","doi":"https://doi.org/10.1109/apsipaasc63619.2025.10849095"},"language":"en","primary_location":{"id":"doi:10.1109/apsipaasc63619.2025.10849095","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc63619.2025.10849095","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015222818","display_name":"Kangjian Huang","orcid":"https://orcid.org/0009-0003-3694-7191"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Kangjian Huang","raw_affiliation_strings":["Southwest Jiaotong University,School of Computing and Artificial Intelligence,Chengdu,China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University,School of Computing and Artificial Intelligence,Chengdu,China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068760974","display_name":"Yan Yang","orcid":"https://orcid.org/0000-0001-5719-043X"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yan Yang","raw_affiliation_strings":["Southwest Jiaotong University,School of Computing and Artificial Intelligence,Chengdu,China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University,School of Computing and Artificial Intelligence,Chengdu,China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060855407","display_name":"Yongquan Jiang","orcid":"https://orcid.org/0000-0003-1651-595X"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongquan Jiang","raw_affiliation_strings":["Southwest Jiaotong University,School of Computing and Artificial Intelligence,Chengdu,China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University,School of Computing and Artificial Intelligence,Chengdu,China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056120706","display_name":"Xiaobo Zhang","orcid":"https://orcid.org/0000-0002-6598-0519"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaobo Zhang","raw_affiliation_strings":["Southwest Jiaotong University,School of Computing and Artificial Intelligence,Chengdu,China"],"affiliations":[{"raw_affiliation_string":"Southwest Jiaotong University,School of Computing and Artificial Intelligence,Chengdu,China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026173981","display_name":"Zhuyi Angelina Li","orcid":"https://orcid.org/0000-0003-1815-7017"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhuyi Angelina Li","raw_affiliation_strings":["Renmin University of China,Business School,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Renmin University of China,Business School,Beijing,China","institution_ids":["https://openalex.org/I78988378"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5015222818"],"corresponding_institution_ids":["https://openalex.org/I4800084"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.27419596,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/slicing","display_name":"Slicing","score":0.878464937210083},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7971453666687012},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5301253199577332},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3412827253341675},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3309047818183899},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.21803686022758484},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.1263464093208313}],"concepts":[{"id":"https://openalex.org/C2776190703","wikidata":"https://www.wikidata.org/wiki/Q488148","display_name":"Slicing","level":2,"score":0.878464937210083},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7971453666687012},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5301253199577332},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3412827253341675},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3309047818183899},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.21803686022758484},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.1263464093208313}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipaasc63619.2025.10849095","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc63619.2025.10849095","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2552900565","https://openalex.org/W2795812085","https://openalex.org/W2883286874","https://openalex.org/W2964241181","https://openalex.org/W2964286567","https://openalex.org/W2993756598","https://openalex.org/W3011688396","https://openalex.org/W3092663126","https://openalex.org/W3119686997","https://openalex.org/W3127131334","https://openalex.org/W3127743092","https://openalex.org/W3172087149","https://openalex.org/W4307411363","https://openalex.org/W4307823382","https://openalex.org/W4382568144","https://openalex.org/W4386076222","https://openalex.org/W4386076325","https://openalex.org/W4402754006"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"The":[0,80,166],"detection":[1,115,201],"of":[2,86,109,143],"video":[3,149],"small":[4,41,57,199],"objects":[5,58],"is":[6,63,154],"challenging":[7],"in":[8,106],"images":[9],"due":[10],"to":[11,21,47,98,102,112,130,137,161,183,195],"their":[12],"limited":[13],"presence,":[14],"which":[15,158],"makes":[16],"the":[17,37,56,68,87,107,123,128,131,144,163,170,175,184,189,196],"information":[18],"more":[19],"susceptible":[20],"loss.":[22],"In":[23],"this":[24],"paper,":[25],"we":[26],"propose":[27],"an":[28],"Adaptive":[29,94],"Focused":[30],"Slicing":[31,96],"Detection":[32],"(AFSDet)":[33],"method":[34],"inspired":[35],"by":[36,180,191],"way":[38],"humans":[39],"observe":[40],"objects.":[42],"AFSDet":[43],"involves":[44],"first":[45,81],"localizing":[46],"a":[48,64,84,103,135,151],"region":[49],"with":[50],"potential":[51],"targets":[52],"and":[53,90,93,126,187],"then":[54],"scrutinizing":[55],"within":[59],"that":[60,169],"region.":[61],"It":[62],"two-stage":[65],"approach":[66],"utilizing":[67],"proposed":[69,171],"model":[70,125],"called":[71],"Deformable":[72],"Head":[73],"YOLO":[74],"Network":[75],"(DHYNet)":[76],"for":[77,156],"object":[78,200],"detection.":[79],"stage":[82,118],"performs":[83],"coarse-detection":[85],"original":[88],"image":[89],"utilizes":[91],"clustering":[92],"Scale-up":[95],"methods":[97],"obtain":[99],"patches,":[100],"leading":[101],"significant":[104],"reduction":[105],"number":[108],"patches":[110,121],"compared":[111,182,194],"previous":[113,197],"slicing-based":[114,198],"methods.The":[116],"second":[117],"feeds":[119],"each":[120],"into":[122],"fine-detection":[124],"passes":[127],"results":[129,167],"next":[132],"frame":[133],"as":[134],"reference":[136],"assist":[138],"coarse-detection.":[139],"Additionally,":[140],"taking":[141],"advantage":[142],"slight":[145],"variations":[146],"between":[147],"consecutive":[148],"frames,":[150],"superimposing":[152],"process":[153],"employed":[155],"coarse-detection,":[157],"also":[159],"contributes":[160],"reducing":[162],"computational":[164],"overhead.":[165],"show":[168],"method,":[172],"tested":[173],"on":[174],"VisDrone-MOT":[176],"dataset,":[177],"improves":[178,188],"accuracy":[179,190],"9.6%":[181],"baseline":[185],"model,":[186],"3.3":[192],"%":[193],"method.":[202]},"counts_by_year":[],"updated_date":"2025-12-19T19:40:27.379048","created_date":"2025-10-10T00:00:00"}
