{"id":"https://openalex.org/W4399881572","doi":"https://doi.org/10.1109/tnnls.2024.3412947","title":"UniHead: Unifying Multi-Perception for Detection Heads","display_name":"UniHead: Unifying Multi-Perception for Detection Heads","publication_year":2024,"publication_date":"2024-06-21","ids":{"openalex":"https://openalex.org/W4399881572","doi":"https://doi.org/10.1109/tnnls.2024.3412947","pmid":"https://pubmed.ncbi.nlm.nih.gov/38905097"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2024.3412947","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2024.3412947","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083942931","display_name":"Hantao Zhou","orcid":"https://orcid.org/0000-0002-0514-0905"},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hantao Zhou","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101960406","display_name":"Rui Yang","orcid":"https://orcid.org/0000-0002-8760-5699"},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Yang","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100667175","display_name":"Yachao Zhang","orcid":"https://orcid.org/0000-0002-1150-8745"},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yachao Zhang","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083020611","display_name":"Haoran Duan","orcid":"https://orcid.org/0000-0001-9956-7020"},"institutions":[{"id":"https://openalex.org/I190082696","display_name":"Durham University","ror":"https://ror.org/01v29qb04","country_code":"GB","type":"education","lineage":["https://openalex.org/I190082696"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Haoran Duan","raw_affiliation_strings":["Department of Computer Science, Durham University, Durham, U.K"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Durham University, Durham, U.K","institution_ids":["https://openalex.org/I190082696"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101524563","display_name":"Yawen Huang","orcid":"https://orcid.org/0000-0002-9569-269X"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yawen Huang","raw_affiliation_strings":["Tencent Jarvis Laboratory, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent Jarvis Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011299161","display_name":"Runze Hu","orcid":"https://orcid.org/0000-0002-6366-3763"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Runze Hu","raw_affiliation_strings":["School of Information and Electronics, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Information and Electronics, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100754504","display_name":"Xiu Li","orcid":"https://orcid.org/0000-0003-0403-1923"},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiu Li","raw_affiliation_strings":["Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051649145","display_name":"Yefeng Zheng","orcid":"https://orcid.org/0000-0003-2195-2847"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yefeng Zheng","raw_affiliation_strings":["Tencent Jarvis Laboratory, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent Jarvis Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5083942931"],"corresponding_institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":5.1447,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.9650108,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"36","issue":"5","first_page":"9565","last_page":"9576"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.972599983215332,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9693999886512756,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.6929685473442078},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5743861198425293},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3808457553386688},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.31693655252456665},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.07296273112297058}],"concepts":[{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.6929685473442078},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5743861198425293},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3808457553386688},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.31693655252456665},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.07296273112297058}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2024.3412947","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2024.3412947","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:38905097","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38905097","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.4300000071525574}],"awards":[{"id":"https://openalex.org/G2935957626","display_name":null,"funder_award_id":"62192712","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7660887274","display_name":null,"funder_award_id":"2020AAA0108303","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G8786339038","display_name":null,"funder_award_id":"WDZC20200820200655001","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":68,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1536680647","https://openalex.org/W1861492603","https://openalex.org/W2031489346","https://openalex.org/W2108598243","https://openalex.org/W2194775991","https://openalex.org/W2565639579","https://openalex.org/W2601564443","https://openalex.org/W2752782242","https://openalex.org/W2884367402","https://openalex.org/W2963150697","https://openalex.org/W2963351448","https://openalex.org/W2963849369","https://openalex.org/W2963857746","https://openalex.org/W2964241181","https://openalex.org/W2964444661","https://openalex.org/W2966926453","https://openalex.org/W2981689412","https://openalex.org/W2982770724","https://openalex.org/W2986357608","https://openalex.org/W3034971973","https://openalex.org/W3035396860","https://openalex.org/W3035473155","https://openalex.org/W3035694605","https://openalex.org/W3042011474","https://openalex.org/W3122490299","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3139049060","https://openalex.org/W3165215538","https://openalex.org/W3167308647","https://openalex.org/W3171660447","https://openalex.org/W3172752666","https://openalex.org/W3176187859","https://openalex.org/W3208871062","https://openalex.org/W4214507171","https://openalex.org/W4220899212","https://openalex.org/W4225745741","https://openalex.org/W4226083961","https://openalex.org/W4288325606","https://openalex.org/W4312312588","https://openalex.org/W4312628331","https://openalex.org/W4312956471","https://openalex.org/W4313007769","https://openalex.org/W4313427331","https://openalex.org/W4318141851","https://openalex.org/W4318953563","https://openalex.org/W4319068750","https://openalex.org/W4362653142","https://openalex.org/W4367048262","https://openalex.org/W4379117118","https://openalex.org/W4386083115","https://openalex.org/W4386108434","https://openalex.org/W4390707165","https://openalex.org/W4390872682","https://openalex.org/W4390873252","https://openalex.org/W4390874491","https://openalex.org/W4392904609","https://openalex.org/W6767109091","https://openalex.org/W6772853553","https://openalex.org/W6779586474","https://openalex.org/W6780959388","https://openalex.org/W6784094891","https://openalex.org/W6811230874","https://openalex.org/W6839204056","https://openalex.org/W6848963243","https://openalex.org/W6855917929","https://openalex.org/W6869262221"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"The":[0,187],"detection":[1,72],"head":[2,23],"constitutes":[3],"a":[4,50,54,60,99,115,135],"pivotal":[5],"component":[6],"within":[7],"object":[8,95],"detectors,":[9],"tasked":[10],"with":[11,145],"executing":[12],"both":[13],"classification":[14,125],"and":[15,37,56,112,126,181],"localization":[16,127],"functions.":[17],"Regrettably,":[18],"the":[19,90,124,131,138,151,167],"commonly":[20],"used":[21],"parallel":[22],"often":[24],"lacks":[25],"omni":[26],"perceptual":[27,79],"capabilities,":[28],"such":[29],"as":[30],"deformation":[31],"perception":[32,35,39],"(DP),":[33],"global":[34],"(GP),":[36],"cross-task":[38,116],"(CTP).":[40],"Despite":[41],"numerous":[42],"methods":[43],"attempting":[44],"to":[45,65,76,92,104,162],"enhance":[46],"these":[47],"abilities":[48,80],"from":[49],"single":[51],"aspect,":[52],"achieving":[53,110],"comprehensive":[55],"unified":[57],"solution":[58],"remains":[59],"significant":[61,160],"challenge.":[62],"In":[63],"response":[64],"this":[66],"challenge,":[67],"we":[68],"develop":[69],"an":[70],"innovative":[71],"head,":[73],"termed":[74],"UniHead,":[75],"unify":[77],"three":[78],"simultaneously.":[81],"More":[82],"precisely,":[83],"our":[84,156],"approach:":[85],"1)":[86],"introduces":[87],"DP,":[88],"enabling":[89],"model":[91,106],"adaptively":[93],"sample":[94],"features;":[96],"2)":[97],"proposes":[98],"dual-axial":[100],"aggregation":[101],"transformer":[102,118],"(DAT)":[103],"adeptly":[105],"long-range":[107],"dependencies,":[108],"thereby":[109],"GP;":[111],"3)":[113],"devises":[114],"interaction":[117,122],"(CIT)":[119],"that":[120,155],"facilitates":[121],"between":[123],"branches,":[128],"thus":[129],"aligning":[130],"two":[132],"tasks.":[133],"As":[134],"plug-and-play":[136],"method,":[137],"proposed":[139],"UniHead":[140,157,168],"can":[141,158,169],"be":[142],"conveniently":[143],"integrated":[144],"existing":[146],"detectors.":[147,164],"Extensive":[148],"experiments":[149],"on":[150],"COCO":[152],"dataset":[153],"demonstrate":[154],"bring":[159],"improvements":[161],"many":[163],"For":[165],"instance,":[166],"obtain":[170],"+2.7":[171],"AP":[172,177,183],"gains":[173,178,184],"in":[174,179,185],"RetinaNet,":[175],"+2.9":[176],"FreeAnchor,":[180],"+2.1":[182],"GFL.":[186],"code":[188],"is":[189],"available":[190],"at":[191],"https://github.com/zht8506/UniHead.":[192]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
