{"id":"https://openalex.org/W4414229298","doi":"https://doi.org/10.1109/tcsvt.2025.3610634","title":"DAOcc: 3D Object Detection Assisted Multi-Sensor Fusion for 3D Occupancy Prediction","display_name":"DAOcc: 3D Object Detection Assisted Multi-Sensor Fusion for 3D Occupancy Prediction","publication_year":2025,"publication_date":"2025-09-16","ids":{"openalex":"https://openalex.org/W4414229298","doi":"https://doi.org/10.1109/tcsvt.2025.3610634"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2025.3610634","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3610634","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101558778","display_name":"Zhen Yang","orcid":"https://orcid.org/0000-0003-2487-1305"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhen Yang","raw_affiliation_strings":["Beijing Mechanical Equipment Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Mechanical Equipment Institute, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112380363","display_name":"Yanpeng Dong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yanpeng Dong","raw_affiliation_strings":["Beijing Mechanical Equipment Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Mechanical Equipment Institute, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102693572","display_name":"Jiayu Wang","orcid":"https://orcid.org/0009-0008-0736-8170"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiayu Wang","raw_affiliation_strings":["Beijing Mechanical Equipment Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Mechanical Equipment Institute, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112882339","display_name":"Heng Wang","orcid":"https://orcid.org/0009-0009-4627-7826"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Heng Wang","raw_affiliation_strings":["Beijing Mechanical Equipment Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Mechanical Equipment Institute, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028346364","display_name":"Lichao Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lichao Ma","raw_affiliation_strings":["Beijing Mechanical Equipment Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Mechanical Equipment Institute, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053085908","display_name":"Zhihua Cui","orcid":"https://orcid.org/0000-0001-7388-3180"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zijian Cui","raw_affiliation_strings":["Beijing Mechanical Equipment Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Mechanical Equipment Institute, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100453144","display_name":"Qi Liu","orcid":"https://orcid.org/0000-0001-5378-6404"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qi Liu","raw_affiliation_strings":["Beijing Mechanical Equipment Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Mechanical Equipment Institute, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000497101","display_name":"Haoran Pei","orcid":"https://orcid.org/0000-0003-2390-9447"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haoran Pei","raw_affiliation_strings":["Beijing Mechanical Equipment Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Mechanical Equipment Institute, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069630739","display_name":"Kexin Zhang","orcid":"https://orcid.org/0000-0001-8950-2178"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kexin Zhang","raw_affiliation_strings":["Beijing Mechanical Equipment Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Mechanical Equipment Institute, Beijing, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100460227","display_name":"Chao Zhang","orcid":"https://orcid.org/0000-0002-9989-6462"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chao Zhang","raw_affiliation_strings":["Beijing Mechanical Equipment Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Beijing Mechanical Equipment Institute, Beijing, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5101558778"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.3498,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.85167228,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"36","issue":"2","first_page":"1742","last_page":"1753"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9879999756813049,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9793999791145325,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.8144999742507935},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.7135000228881836},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.5952000021934509},{"id":"https://openalex.org/keywords/image-fusion","display_name":"Image fusion","score":0.5583999752998352},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.5288000106811523},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4677000045776367},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4659999907016754},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4397999942302704},{"id":"https://openalex.org/keywords/backbone-network","display_name":"Backbone network","score":0.41019999980926514}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.8144999742507935},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8112000226974487},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.7135000228881836},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6482999920845032},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.5952000021934509},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5701000094413757},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.5583999752998352},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.5288000106811523},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4677000045776367},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4659999907016754},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4397999942302704},{"id":"https://openalex.org/C88796919","wikidata":"https://www.wikidata.org/wiki/Q1142907","display_name":"Backbone network","level":2,"score":0.41019999980926514},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.40149998664855957},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.3862000107765198},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.36079999804496765},{"id":"https://openalex.org/C160331591","wikidata":"https://www.wikidata.org/wiki/Q7075743","display_name":"Occupancy","level":2,"score":0.3368000090122223},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.33379998803138733},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32910001277923584},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.328000009059906},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.31470000743865967},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.29919999837875366},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.29899999499320984},{"id":"https://openalex.org/C126422989","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature detection (computer vision)","level":4,"score":0.28439998626708984},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.2799000144004822},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2768999934196472},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2736000120639801},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.26649999618530273},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.265500009059906},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.25189998745918274}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2025.3610634","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3610634","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W2194775991","https://openalex.org/W2565639579","https://openalex.org/W2601564443","https://openalex.org/W2795587607","https://openalex.org/W2897529137","https://openalex.org/W2963351448","https://openalex.org/W2966926453","https://openalex.org/W3012573144","https://openalex.org/W3035574168","https://openalex.org/W3098650412","https://openalex.org/W3167095230","https://openalex.org/W3170030651","https://openalex.org/W3174692508","https://openalex.org/W3215584334","https://openalex.org/W4225986494","https://openalex.org/W4288325606","https://openalex.org/W4312707458","https://openalex.org/W4312894406","https://openalex.org/W4316660720","https://openalex.org/W4382450829","https://openalex.org/W4382464460","https://openalex.org/W4383066393","https://openalex.org/W4383108631","https://openalex.org/W4385151926","https://openalex.org/W4385804883","https://openalex.org/W4386083035","https://openalex.org/W4390872444","https://openalex.org/W4390872638","https://openalex.org/W4390873371","https://openalex.org/W4390873564","https://openalex.org/W4390874310","https://openalex.org/W4393149498","https://openalex.org/W4393156295","https://openalex.org/W4393159587","https://openalex.org/W4394708612","https://openalex.org/W4398150928","https://openalex.org/W4402186962","https://openalex.org/W4402713134","https://openalex.org/W4402733575","https://openalex.org/W4402754236","https://openalex.org/W4402754282","https://openalex.org/W4403721488","https://openalex.org/W4404102188","https://openalex.org/W4404410822","https://openalex.org/W4405197104","https://openalex.org/W4413144594","https://openalex.org/W4413146889","https://openalex.org/W4415795299"],"related_works":[],"abstract_inverted_index":{"Multi-sensor":[0],"fusion":[1,45,52],"significantly":[2],"enhances":[3],"the":[4,127],"accuracy":[5],"and":[6,19,29,93,129,132,146],"robustness":[7],"of":[8],"3D":[9,77],"semantic":[10],"occupancy":[11,72],"prediction,":[12],"which":[13],"is":[14,168],"crucial":[15],"for":[16,59],"autonomous":[17],"driving":[18],"robotics.":[20],"However,":[21],"most":[22],"existing":[23],"approaches":[24,46],"depend":[25],"on":[26,49,125,161],"high-resolution":[27],"images":[28],"complex":[30],"networks":[31],"to":[32,81,107],"achieve":[33],"top":[34],"performance,":[35,86],"hindering":[36],"their":[37],"deployment":[38],"in":[39,83],"practical":[40,94],"scenarios.":[41],"Moreover,":[42],"current":[43],"multi-sensor":[44],"mainly":[47],"focus":[48],"improving":[50],"feature":[51],"while":[53,87,157],"largely":[54],"neglecting":[55],"effective":[56],"supervision":[57,80],"strategies":[58],"those":[60],"features.":[61],"To":[62],"address":[63],"these":[64],"issues,":[65],"we":[66,99],"propose":[67],"DAOcc,":[68],"a":[69,89,101,138,143],"novel":[70],"multi-modal":[71],"prediction":[73],"framework":[74],"that":[75,119],"leverages":[76],"object":[78],"detection":[79],"assist":[82],"achieving":[84],"superior":[85],"using":[88,141],"deployment-friendly":[90],"image":[91,114],"backbone":[92,145],"input":[95,148],"resolution.":[96,115,149],"In":[97],"addition,":[98],"introduce":[100],"BEV":[102],"View":[103],"Range":[104],"Extension":[105],"strategy":[106],"mitigate":[108],"performance":[109],"degradation":[110],"caused":[111],"by":[112,137],"lower":[113],"Extensive":[116],"experiments":[117],"demonstrate":[118],"DAOcc":[120,153],"achieves":[121],"new":[122],"state-of-the-art":[123,135],"results":[124],"both":[126],"Occ3D-nuScenes":[128],"Occ3D-Waymo":[130],"benchmarks,":[131],"outperforms":[133],"previous":[134],"methods":[136],"significant":[139],"margin":[140],"only":[142],"ResNet-50":[144],"256\u00d7704":[147],"With":[150],"TensorRT":[151],"optimization,":[152],"reaches":[154],"104.9":[155],"FPS":[156],"maintaining":[158],"54.2":[159],"mIoU":[160],"an":[162],"NVIDIA":[163],"RTX":[164],"4090":[165],"GPU.":[166],"Code":[167],"available":[169],"at":[170],"https://github.com/AlphaPlusTT/DAOcc.":[171]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
