{"id":"https://openalex.org/W4413925688","doi":"https://doi.org/10.1109/tmm.2025.3604917","title":"Enhanced Head: Exploring Strong Detection Heads With Vision Transformer","display_name":"Enhanced Head: Exploring Strong Detection Heads With Vision Transformer","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4413925688","doi":"https://doi.org/10.1109/tmm.2025.3604917"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2025.3604917","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3604917","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060010090","display_name":"Zewen Du","orcid":"https://orcid.org/0009-0003-7091-8159"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zewen Du","raw_affiliation_strings":["National Key Lab of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0003-7091-8159","affiliations":[{"raw_affiliation_string":"National Key Lab of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102717988","display_name":"Zhenjiang Hu","orcid":"https://orcid.org/0000-0002-9034-205X"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenjiang Hu","raw_affiliation_strings":["National Key Lab of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Key Lab of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061450079","display_name":"Guiyu Zhao","orcid":"https://orcid.org/0000-0002-5984-3390"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guiyu Zhao","raw_affiliation_strings":["National Key Lab of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Key Lab of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086463798","display_name":"Ying Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying Jin","raw_affiliation_strings":["National Key Lab of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Key Lab of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072523018","display_name":"Hongbin Ma","orcid":"https://orcid.org/0000-0002-5734-3157"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongbin Ma","raw_affiliation_strings":["National Key Lab of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5734-3157","affiliations":[{"raw_affiliation_string":"National Key Lab of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.18843112,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"27","issue":null,"first_page":"7834","last_page":"7848"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.545199990272522,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.545199990272522,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.4668999910354614,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7488524913787842},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5502660870552063},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.49096038937568665},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4848128855228424},{"id":"https://openalex.org/keywords/head","display_name":"Head (geology)","score":0.44150227308273315},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32394105195999146},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.16044402122497559},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.11658138036727905},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.11480522155761719},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09725522994995117}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7488524913787842},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5502660870552063},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.49096038937568665},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4848128855228424},{"id":"https://openalex.org/C2780312720","wikidata":"https://www.wikidata.org/wiki/Q5689100","display_name":"Head (geology)","level":2,"score":0.44150227308273315},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32394105195999146},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.16044402122497559},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.11658138036727905},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.11480522155761719},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09725522994995117},{"id":"https://openalex.org/C114793014","wikidata":"https://www.wikidata.org/wiki/Q52109","display_name":"Geomorphology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2025.3604917","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3604917","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2646844173","display_name":null,"funder_award_id":"62076028","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1536680647","https://openalex.org/W1861492603","https://openalex.org/W2102605133","https://openalex.org/W2161969291","https://openalex.org/W2168356304","https://openalex.org/W2194775991","https://openalex.org/W2549139847","https://openalex.org/W2565639579","https://openalex.org/W2601564443","https://openalex.org/W2886904239","https://openalex.org/W2934198733","https://openalex.org/W2962677013","https://openalex.org/W2962731685","https://openalex.org/W2963150697","https://openalex.org/W2963299996","https://openalex.org/W2963351448","https://openalex.org/W2964241181","https://openalex.org/W2982770724","https://openalex.org/W2986357608","https://openalex.org/W2989604896","https://openalex.org/W3012573144","https://openalex.org/W3035396860","https://openalex.org/W3035473155","https://openalex.org/W3035694605","https://openalex.org/W3109381875","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3157386596","https://openalex.org/W3171660447","https://openalex.org/W3175515048","https://openalex.org/W3176187859","https://openalex.org/W3205483686","https://openalex.org/W4205334590","https://openalex.org/W4214507171","https://openalex.org/W4312312588","https://openalex.org/W4312881242","https://openalex.org/W4313525589","https://openalex.org/W4385245566","https://openalex.org/W4386075524","https://openalex.org/W4386075796","https://openalex.org/W4386076053","https://openalex.org/W4386076325","https://openalex.org/W4390872693","https://openalex.org/W4390872937","https://openalex.org/W4399881572","https://openalex.org/W4410616160"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"As":[0],"a":[1,33,128,137],"crucial":[2],"component":[3],"of":[4],"object":[5],"detectors,":[6],"current":[7],"detection":[8,139,160],"heads":[9],"often":[10],"lack":[11],"the":[12,48,53,58,149,158,182],"capability":[13],"to":[14,20,39,51],"effectively":[15],"utilize":[16],"contextual":[17],"information,":[18],"adapt":[19],"deformable":[21,107],"objects,":[22],"and":[23,26,79,101,122,141,152,175],"align":[24],"features":[25,115],"tasks.":[27],"However,":[28],"most":[29],"existing":[30],"methods":[31],"prioritize":[32],"single":[34],"capability,":[35],"lacking":[36],"comprehensive":[37],"approaches":[38],"introduce":[40],"them":[41],"simultaneously.":[42],"In":[43],"this":[44],"paper,":[45],"we":[46,62],"propose":[47,63],"Enhanced":[49,134,163],"Head":[50,135,164],"integrate":[52],"above":[54],"three":[55,64],"capabilities":[56],"into":[57],"detectors":[59],"concurrently.":[60],"Specifically,":[61],"attention":[65],"blocks":[66],"with":[67,116],"linear":[68],"complexity:":[69],"Global":[70],"Concentrated":[71],"Attention":[72,77,82],"(GCA),":[73],"Local":[74],"Deformable":[75],"Cross-Task":[76,81],"(LDCA),":[78],"Boundary-Aware":[80],"(BACA).":[83],"The":[84,96,111],"GCA":[85],"captures":[86],"long-range":[87],"dependencies":[88],"efficiently":[89],"by":[90,104],"employing":[91],"Spatial":[92],"Information":[93],"Concentration":[94],"(SIC).":[95],"LDCA":[97],"improves":[98],"feature":[99,109],"alignment":[100,121],"deformation":[102,125],"adaptability":[103,126],"enabling":[105],"local":[106],"cross-task":[108],"interactions.":[110],"BACA":[112],"aligns":[113],"classification":[114],"localization":[117],"results,":[118],"enhancing":[119],"task":[120],"further":[123],"improving":[124],"through":[127,145],"region-deformable":[129],"interaction":[130],"scheme.":[131],"We":[132],"implement":[133],"as":[136],"plug-and-play":[138],"head":[140],"evaluate":[142],"its":[143],"effectiveness":[144],"extensive":[146],"experiments":[147],"on":[148,157],"MS":[150],"COCO":[151,159],"VisDrone":[153],"datasets.":[154],"For":[155],"instance,":[156],"benchmark,":[161],"our":[162],"achieves":[165],"+3.6":[166],"AP":[167,172,177],"gain":[168],"for":[169,173,178],"FSAF,":[170],"+3.3":[171],"RetinaNet,":[174],"+2.9":[176],"ATSS":[179],"while":[180],"reducing":[181],"FLOPs.":[183]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
