{"id":"https://openalex.org/W4401414324","doi":"https://doi.org/10.1109/icra57147.2024.10611684","title":"VOOM: Robust Visual Object Odometry and Mapping using Hierarchical Landmarks","display_name":"VOOM: Robust Visual Object Odometry and Mapping using Hierarchical Landmarks","publication_year":2024,"publication_date":"2024-05-13","ids":{"openalex":"https://openalex.org/W4401414324","doi":"https://doi.org/10.1109/icra57147.2024.10611684"},"language":"en","primary_location":{"id":"doi:10.1109/icra57147.2024.10611684","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra57147.2024.10611684","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100631530","display_name":"Yutong Wang","orcid":"https://orcid.org/0000-0003-2981-7471"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yutong Wang","raw_affiliation_strings":["Beijing Institute of Technology,School of Mechanical Engineering,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology,School of Mechanical Engineering,China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075033951","display_name":"Chaoyang Jiang","orcid":"https://orcid.org/0000-0002-8669-2911"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chaoyang Jiang","raw_affiliation_strings":["Beijing Institute of Technology,School of Mechanical Engineering,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology,School of Mechanical Engineering,China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032262344","display_name":"Xieyuanli Chen","orcid":"https://orcid.org/0000-0003-0955-6681"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xieyuanli Chen","raw_affiliation_strings":["National University of Defense Technology,College of Intelligence Science and Technology,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National University of Defense Technology,College of Intelligence Science and Technology,China","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100631530"],"corresponding_institution_ids":["https://openalex.org/I125839683"],"apc_list":null,"apc_paid":null,"fwci":17.6338,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.9882367,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"10298","last_page":"10304"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11211","display_name":"3D Surveying and Cultural Heritage","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1907","display_name":"Geology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7988932728767395},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.7603600025177002},{"id":"https://openalex.org/keywords/visual-odometry","display_name":"Visual odometry","score":0.7493142485618591},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7479982972145081},{"id":"https://openalex.org/keywords/odometry","display_name":"Odometry","score":0.5440664887428284},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5100675225257874},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32932937145233154},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.17981505393981934},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.09643527865409851}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7988932728767395},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7603600025177002},{"id":"https://openalex.org/C5799516","wikidata":"https://www.wikidata.org/wiki/Q4110915","display_name":"Visual odometry","level":3,"score":0.7493142485618591},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7479982972145081},{"id":"https://openalex.org/C49441653","wikidata":"https://www.wikidata.org/wiki/Q2014717","display_name":"Odometry","level":4,"score":0.5440664887428284},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5100675225257874},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32932937145233154},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.17981505393981934},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.09643527865409851}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra57147.2024.10611684","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra57147.2024.10611684","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5699999928474426,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W612478963","https://openalex.org/W1612997784","https://openalex.org/W2021851106","https://openalex.org/W2097696373","https://openalex.org/W2140427427","https://openalex.org/W2151290401","https://openalex.org/W2152671441","https://openalex.org/W2474281075","https://openalex.org/W2535547924","https://openalex.org/W2610694266","https://openalex.org/W2745859992","https://openalex.org/W2887751724","https://openalex.org/W2888144883","https://openalex.org/W2937713253","https://openalex.org/W2938672559","https://openalex.org/W2963357556","https://openalex.org/W2964226622","https://openalex.org/W2967862165","https://openalex.org/W3020500358","https://openalex.org/W3083706479","https://openalex.org/W3083815714","https://openalex.org/W3090386798","https://openalex.org/W3098467253","https://openalex.org/W3099913005","https://openalex.org/W3102327032","https://openalex.org/W3199149066","https://openalex.org/W3207330959","https://openalex.org/W3208154594","https://openalex.org/W4311912364","https://openalex.org/W4322731032","https://openalex.org/W4377000514","https://openalex.org/W6802878479"],"related_works":["https://openalex.org/W2979950214","https://openalex.org/W87609089","https://openalex.org/W3024737167","https://openalex.org/W2414561716","https://openalex.org/W3161199934","https://openalex.org/W2303855011","https://openalex.org/W2312326526","https://openalex.org/W2412578866","https://openalex.org/W3105866016","https://openalex.org/W4312703710"],"abstract_inverted_index":{"In":[0,71,158],"recent":[1],"years,":[2],"object-oriented":[3,203],"simultaneous":[4],"localization":[5,32],"and":[6,80,87,114,153,175,187,205],"mapping":[7,195],"(SLAM)":[8],"has":[9],"attracted":[10],"increasing":[11],"attention":[12],"due":[13],"to":[14,17,30,124,145,169],"its":[15],"ability":[16],"provide":[18],"high-level":[19,85],"semantic":[20],"information":[21,144],"while":[22],"maintaining":[23],"computational":[24],"efficiency.":[25],"Some":[26],"researchers":[27],"have":[28,45],"attempted":[29],"enhance":[31,146],"accuracy":[33],"by":[34],"integrating":[35],"the":[36,55,91,130,147,156,159,164,172,176,185],"modeled":[37],"object":[38,58,102,143,161,194],"residuals":[39,103],"into":[40],"bundle":[41,105,180],"adjustment.":[42,106],"However,":[43],"few":[44],"demonstrated":[46],"better":[47],"results":[48],"than":[49,68],"feature-based":[50],"visual":[51,160,193],"SLAM":[52,204,208],"systems,":[53],"as":[54,61,90,211],"generic":[56],"coarse":[57],"models,":[59],"such":[60,210],"cuboids":[62],"or":[63],"ellipsoids,":[64],"are":[65],"less":[66],"accurate":[67],"feature":[69,151,206],"points.":[70],"this":[72],"paper,":[73],"we":[74,108,141],"propose":[75],"a":[76,95,115,133],"Visual":[77],"Object":[78],"Odometry":[79],"Mapping":[81],"framework":[82],"VOOM":[83,200],"using":[84,101],"objects":[86,186],"low-level":[88],"points":[89,152,207],"hierarchical":[92],"landmarks":[93],"in":[94,104,191,213],"coarse-to-fine":[96],"manner":[97],"instead":[98],"of":[99,132,150,215,219],"directly":[100],"Firstly,":[107],"introduce":[109],"an":[110],"improved":[111],"observation":[112],"model":[113],"novel":[116],"data":[117,148],"association":[118,149],"method":[119,221],"for":[120],"dual":[121],"quadrics,":[122],"employed":[123,168],"represent":[125],"physical":[126],"objects.":[127,177],"It":[128],"facilitates":[129],"creation":[131],"3D":[134],"map":[135,166],"that":[136,199],"closely":[137],"reflects":[138],"reality.":[139],"Next,":[140],"use":[142],"consequently":[154],"update":[155],"map.":[157],"odometry":[162],"backend,":[163],"updated":[165],"is":[167,182,222],"further":[170],"optimize":[171],"camera":[173],"pose":[174],"Meanwhile,":[178],"local":[179],"adjustment":[181],"performed":[183],"utilizing":[184],"points-based":[188],"covisibility":[189],"graphs":[190],"our":[192,220],"process.":[196],"Experiments":[197],"show":[198],"outperforms":[201],"both":[202],"systems":[209],"ORB-SLAM2":[212],"terms":[214],"localization.":[216],"The":[217],"implementation":[218],"available":[223],"at":[224],"https://github.com/yutongwangBIT/VOOM.git.":[225]},"counts_by_year":[{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":2}],"updated_date":"2026-05-02T08:42:23.175194","created_date":"2025-10-10T00:00:00"}
