{"id":"https://openalex.org/W7131798988","doi":"https://doi.org/10.3837/tiis.2026.02.014","title":"HAT-YOLO: Hybrid Attention and Transformer-Integrated Model for UAV Object Detection on Embedded Devices","display_name":"HAT-YOLO: Hybrid Attention and Transformer-Integrated Model for UAV Object Detection on Embedded Devices","publication_year":2026,"publication_date":"2026-02-27","ids":{"openalex":"https://openalex.org/W7131798988","doi":"https://doi.org/10.3837/tiis.2026.02.014"},"language":null,"primary_location":{"id":"doi:10.3837/tiis.2026.02.014","is_oa":true,"landing_page_url":"https://doi.org/10.3837/tiis.2026.02.014","pdf_url":"https://itiis.org/digital-library/manuscript/file/105901/TIIS Vol 20, No 2-14.pdf","source":{"id":"https://openalex.org/S204131793","display_name":"KSII Transactions on Internet and Information Systems","issn_l":"1976-7277","issn":["1976-7277","2288-1468"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4323966148","host_organization_name":"Korea Society of Internet Information","host_organization_lineage":["https://openalex.org/P4323966148"],"host_organization_lineage_names":["Korea Society of Internet Information"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"KSII Transactions on Internet and Information Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://itiis.org/digital-library/manuscript/file/105901/TIIS Vol 20, No 2-14.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108962193","display_name":"Md. Minhazul Haq","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Md. Minhazul Haq","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122966606","display_name":"Anis Salwa Mohd Khairuddin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anis Salwa Mohd Khairuddin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037634436","display_name":"Effariza Hanafi","orcid":"https://orcid.org/0000-0001-6384-0435"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Effariza Hanafi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010156990","display_name":"Hafiz Muhammad Fahad Noman","orcid":"https://orcid.org/0000-0001-8507-5383"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hafiz Muhammad Fahad Noman","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5034164631","display_name":"Mohamad Haniff Junos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mohamad Haniff Junos","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5108962193"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.73972445,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"20","issue":"2","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.5764999985694885,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.5764999985694885,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.03099999949336052,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.02930000051856041,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6901000142097473},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5548999905586243},{"id":"https://openalex.org/keywords/drone","display_name":"Drone","score":0.289000004529953},{"id":"https://openalex.org/keywords/object-class-detection","display_name":"Object-class detection","score":0.28439998626708984}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.906000018119812},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6901000142097473},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6272000074386597},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5989999771118164},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5548999905586243},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.4311999976634979},{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.289000004529953},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.28859999775886536},{"id":"https://openalex.org/C71681937","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object-class detection","level":5,"score":0.28439998626708984},{"id":"https://openalex.org/C4641261","wikidata":"https://www.wikidata.org/wiki/Q11681085","display_name":"Face detection","level":4,"score":0.2676999866962433}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3837/tiis.2026.02.014","is_oa":true,"landing_page_url":"https://doi.org/10.3837/tiis.2026.02.014","pdf_url":"https://itiis.org/digital-library/manuscript/file/105901/TIIS Vol 20, No 2-14.pdf","source":{"id":"https://openalex.org/S204131793","display_name":"KSII Transactions on Internet and Information Systems","issn_l":"1976-7277","issn":["1976-7277","2288-1468"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4323966148","host_organization_name":"Korea Society of Internet Information","host_organization_lineage":["https://openalex.org/P4323966148"],"host_organization_lineage_names":["Korea Society of Internet Information"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"KSII Transactions on Internet and Information Systems","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.3837/tiis.2026.02.014","is_oa":true,"landing_page_url":"https://doi.org/10.3837/tiis.2026.02.014","pdf_url":"https://itiis.org/digital-library/manuscript/file/105901/TIIS Vol 20, No 2-14.pdf","source":{"id":"https://openalex.org/S204131793","display_name":"KSII Transactions on Internet and Information Systems","issn_l":"1976-7277","issn":["1976-7277","2288-1468"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4323966148","host_organization_name":"Korea Society of Internet Information","host_organization_lineage":["https://openalex.org/P4323966148"],"host_organization_lineage_names":["Korea Society of Internet Information"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"KSII Transactions on Internet and Information Systems","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.5054135322570801,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7131798988.pdf","grobid_xml":"https://content.openalex.org/works/W7131798988.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"rapid":[1],"advancement":[2],"of":[3,12],"unmanned":[4],"aerial":[5,69],"vehicles":[6],"(UAVs)":[7],"has":[8],"increased":[9],"the":[10],"demand":[11],"accurate,":[13],"lightweight":[14,94,172],"and":[15,39,118,126,130,139,154,158,160,166,178,189,213],"real-time":[16,195],"object":[17,25,41],"detection":[18,26,67,196,209],"models":[19,47],"suitable":[20],"for":[21,64,99,112,220],"embedded":[22,223],"deployment.However,":[23],"target":[24],"from":[27],"remote":[28],"sensing":[29],"images":[30,70],"is":[31],"challenging":[32],"due":[33],"to":[34,89],"scale":[35],"variation,":[36],"complex":[37],"backgrounds":[38],"high":[40],"density.Additionally,":[42],"many":[43],"existing":[44],"deep":[45],"learning-based":[46],"require":[48],"large":[49],"GPU":[50,142],"memory.To":[51],"overcome":[52],"these":[53],"limitations,":[54],"we":[55],"proposed":[56,75],"a":[57,82],"HAT-YOLO":[58,76,122,147,183],"model,":[59],"an":[60],"improved":[61,148],"YOLOv8n-based":[62],"architecture":[63,173],"efficient":[65],"vehicle":[66],"in":[68,156,162],"using":[71,133],"limited":[72],"memory":[73],"devices.The":[74],"model":[77,123,206],"introduces":[78],"three":[79],"key":[80],"modules.Firstly,":[81],"dual":[83],"channel-spatial":[84],"attention":[85],"based":[86,96],"A2C2":[87],"module":[88,98,111],"improve":[90],"local":[91],"feature":[92,104,116],"discrimination.Secondly,":[93],"transformer":[95],"TA2C2":[97],"better":[100],"long-range":[101],"global":[102],"context":[103],"extraction.Finally,":[105],"GELU":[106],"activation":[107],"function":[108],"integrated":[109],"CBG":[110],"faster":[113],"convergence,":[114],"non-linear":[115],"representation":[117],"lower":[119],"processing":[120],"time.The":[121],"was":[124],"trained":[125],"evaluated":[127],"on":[128,164,187,192,198,222],"VEDAI":[129,165,188],"RSOD":[131,167],"datasets":[132],"NVIDIA":[134],"RTX":[135],"A2000,":[136],"Google":[137],"Colab":[138],"Jetson":[140,181],"Nano":[141],"platforms.Experimental":[143],"results":[144,201],"demonstrate":[145],"that":[146,203],"accuracy":[149],"over":[150],"YOLOv8n":[151],"by":[152],"6.7%":[153],"4.2%":[155],"mAP@0.5":[157],"6.1%":[159],"3.2%":[161],"mAP@0.5:0.95":[163],"datasets,":[168],"respectively,":[169],"while":[170],"maintaining":[171],"with":[174],"3.82":[175],"million":[176],"parameters":[177],"8.9":[179],"GFLOPs.On":[180],"Nano,":[182],"achieves":[184],"17.2":[185],"FPS":[186,191],"18.4":[190],"RSOD,":[193],"indicating":[194],"performance":[197],"resource-constrained":[199],"devices.These":[200],"show":[202],"our":[204],"developed":[205],"effectively":[207],"balances":[208],"accuracy,":[210],"architectural":[211],"complexity":[212],"inference":[214],"speed,":[215],"making":[216],"it":[217],"highly":[218],"feasible":[219],"deployment":[221],"platforms.":[224]},"counts_by_year":[],"updated_date":"2026-03-11T06:11:40.159057","created_date":"2026-02-27T00:00:00"}
