{"id":"https://openalex.org/W4391768428","doi":"https://doi.org/10.1109/itsc57777.2023.10422455","title":"Small Object Detector Using Contextual Local Features and Global Representations for Autonomous Driving","display_name":"Small Object Detector Using Contextual Local Features and Global Representations for Autonomous Driving","publication_year":2023,"publication_date":"2023-09-24","ids":{"openalex":"https://openalex.org/W4391768428","doi":"https://doi.org/10.1109/itsc57777.2023.10422455"},"language":"en","primary_location":{"id":"doi:10.1109/itsc57777.2023.10422455","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc57777.2023.10422455","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 26th International Conference on Intelligent Transportation Systems (ITSC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089890948","display_name":"Xuke Wu","orcid":"https://orcid.org/0009-0004-0055-1758"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xuke Wu","raw_affiliation_strings":["School of Artificial Intelligence, University of Chinese Academy of Sciences,Beijing,China,100049","State Key Laboratory of Multimodal Artificial Intelligence Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences,Beijing,China,100049","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"State Key Laboratory of Multimodal Artificial Intelligence Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112113074","display_name":"Bin Tian","orcid":"https://orcid.org/0000-0003-1050-1282"},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Tian","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Sciences,State Key Laboratory of Multimodal Artificial Intelligence Systems,Beijing,China,100190"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences,State Key Laboratory of Multimodal Artificial Intelligence Systems,Beijing,China,100190","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088979194","display_name":"Gang Xiong","orcid":"https://orcid.org/0000-0002-4303-5559"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gang Xiong","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Sciences,Beijing Engineering Research Center of Intelligent Systems and Technology,China","Beijing Engineering Research Center of Intelligent Systems and Technology, Institute of Automation, Chinese Academy of Sciences, China"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences,Beijing Engineering Research Center of Intelligent Systems and Technology,China","institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Beijing Engineering Research Center of Intelligent Systems and Technology, Institute of Automation, Chinese Academy of Sciences, China","institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032701630","display_name":"Bing Song","orcid":"https://orcid.org/0000-0002-7182-0175"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bing Song","raw_affiliation_strings":["School of Artificial Intelligence, University of Chinese Academy of Sciences,Beijing,China,100049","State Key Laboratory of Multimodal Artificial Intelligence Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences,Beijing,China,100049","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"State Key Laboratory of Multimodal Artificial Intelligence Systems, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025706580","display_name":"Peijun Ye","orcid":"https://orcid.org/0000-0001-9987-9016"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peijun Ye","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Sciences,State Key Laboratory of Multimodal Artificial Intelligence Systems,Beijing,China,100190"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences,State Key Laboratory of Multimodal Artificial Intelligence Systems,Beijing,China,100190","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042359485","display_name":"Fenghua Zhu","orcid":"https://orcid.org/0000-0003-2886-6968"},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fenghua Zhu","raw_affiliation_strings":["Institute of Automation, Chinese Academy of Sciences,State Key Laboratory of Multimodal Artificial Intelligence Systems,Beijing,China,100190"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences,State Key Laboratory of Multimodal Artificial Intelligence Systems,Beijing,China,100190","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5089890948"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210112150","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.1228,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.46403436,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"4396","last_page":"4401"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.963100016117096,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.963100016117096,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9189000129699707,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.653767466545105},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5651232004165649},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.5433609485626221},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5335184931755066},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5168057680130005},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.46652254462242126},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.2396620512008667},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.11577147245407104}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.653767466545105},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5651232004165649},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.5433609485626221},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5335184931755066},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5168057680130005},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.46652254462242126},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2396620512008667},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.11577147245407104}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/itsc57777.2023.10422455","is_oa":false,"landing_page_url":"https://doi.org/10.1109/itsc57777.2023.10422455","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 26th International Conference on Intelligent Transportation Systems (ITSC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3064315853","display_name":null,"funder_award_id":"U1909204,61876011,52071312","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W2194775991","https://openalex.org/W2601564443","https://openalex.org/W2618530766","https://openalex.org/W2955058313","https://openalex.org/W2963150697","https://openalex.org/W2981958729","https://openalex.org/W2997225633","https://openalex.org/W3094502228","https://openalex.org/W3096609285","https://openalex.org/W3121523901","https://openalex.org/W3138516171","https://openalex.org/W3160694286","https://openalex.org/W3168114581","https://openalex.org/W4213019189","https://openalex.org/W4214493665","https://openalex.org/W4289752563","https://openalex.org/W4296501493","https://openalex.org/W4308080010","https://openalex.org/W4312526244","https://openalex.org/W4319336343","https://openalex.org/W4324119491","https://openalex.org/W4385245566","https://openalex.org/W4386608660","https://openalex.org/W6751733626","https://openalex.org/W6762718338","https://openalex.org/W6796617330"],"related_works":["https://openalex.org/W2755342338","https://openalex.org/W2058170566","https://openalex.org/W2036807459","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W1969923398","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2079911747"],"abstract_inverted_index":{"We":[0],"present":[1],"a":[2,56,112],"hybrid":[3],"architecture":[4],"called":[5],"Contextual-Enhanced":[6],"Transformer":[7],"Network":[8],"(CEFormer)":[9],"that":[10,60,85,117],"leverages":[11],"both":[12,65],"Convolutional":[13],"Neural":[14],"Networks":[15],"(CNN)":[16],"and":[17,36,67,81,87,91,121,139,142,157],"transformer-style":[18],"networks":[19],"for":[20,69,97],"computer":[21],"vision":[22],"tasks.":[23],"CNNs":[24,66],"are":[25,41],"good":[26,42],"at":[27,43],"modeling":[28],"local":[29,34],"features":[30,47,90,93],"due":[31,48],"to":[32,49],"their":[33,50],"nature":[35],"weight":[37],"sharing,":[38],"while":[39],"transformers":[40,68],"capturing":[44],"global":[45],"contextual":[46,82,92],"self-attention":[51],"mechanism.":[52],"Our":[53,128],"CEFormer":[54,129],"uses":[55],"parallel":[57],"network":[58],"structure":[59],"combines":[61],"the":[62,98,119,125],"strengths":[63],"of":[64,100,124],"image":[70],"feature":[71,126],"representation.":[72],"Specifically,":[73],"we":[74,110],"design":[75],"an":[76,105],"enhanced":[77],"multi-headed":[78],"attention":[79,83],"module":[80,84,116],"extracts":[86],"enhances":[88],"globle":[89],"on":[94,153],"two":[95],"branches":[96],"task":[99],"small":[101],"target":[102,134],"detection":[103,135],"in":[104,133],"autonomous":[106],"driving":[107],"environment.":[108],"Moreover,":[109],"propose":[111],"lightweight":[113],"cross-branch":[114],"fusion":[115],"reduces":[118],"parameters":[120],"computational":[122],"complexity":[123],"interaction.":[127],"achieves":[130],"competitive":[131],"results":[132],"with":[136],"Mask":[137],"R-CNN":[138],"outperforms":[140],"ResNet":[141],"transformer-based":[143],"models.":[144],"It":[145],"also":[146],"shows":[147],"significant":[148],"improvement":[149],"over":[150],"other":[151],"methods":[152],"MS":[154],"COCO,":[155],"TT100K,":[156],"ImageNet":[158],"datasets.":[159]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
