{"id":"https://openalex.org/W7127918475","doi":"https://doi.org/10.48550/arxiv.2602.05855","title":"A Hybrid Autoencoder for Robust Heightmap Generation from Fused Lidar and Depth Data for Humanoid Robot Locomotion","display_name":"A Hybrid Autoencoder for Robust Heightmap Generation from Fused Lidar and Depth Data for Humanoid Robot Locomotion","publication_year":2026,"publication_date":"2026-02-05","ids":{"openalex":"https://openalex.org/W7127918475","doi":"https://doi.org/10.48550/arxiv.2602.05855"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.05855","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125169247","display_name":"Dennis Bank","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bank, Dennis","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125122021","display_name":"Joost Cordes","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cordes, Joost","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039578386","display_name":"Thomas Seel","orcid":"https://orcid.org/0000-0002-6920-1690"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Seel, Thomas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5028312231","display_name":"Simon F. G. Ehlers","orcid":"https://orcid.org/0000-0001-5524-6639"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ehlers, Simon F. G.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5125169247"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.7878999710083008,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.7878999710083008,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12153","display_name":"Advanced Optical Sensing Technologies","score":0.04340000078082085,"subfield":{"id":"https://openalex.org/subfields/3105","display_name":"Instrumentation"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.019200000911951065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/humanoid-robot","display_name":"Humanoid robot","score":0.6292999982833862},{"id":"https://openalex.org/keywords/lidar","display_name":"Lidar","score":0.5641000270843506},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.527400016784668},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.512499988079071},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.5016999840736389},{"id":"https://openalex.org/keywords/terrain","display_name":"Terrain","score":0.45089998841285706},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.42590001225471497},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.42410001158714294},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.42399999499320984}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7620999813079834},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7440000176429749},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6452999711036682},{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.6292999982833862},{"id":"https://openalex.org/C51399673","wikidata":"https://www.wikidata.org/wiki/Q504027","display_name":"Lidar","level":2,"score":0.5641000270843506},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.527400016784668},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.512499988079071},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.5016999840736389},{"id":"https://openalex.org/C161840515","wikidata":"https://www.wikidata.org/wiki/Q186131","display_name":"Terrain","level":2,"score":0.45089998841285706},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.42590001225471497},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.42410001158714294},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.42399999499320984},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4120999872684479},{"id":"https://openalex.org/C115051666","wikidata":"https://www.wikidata.org/wiki/Q6522493","display_name":"Ranging","level":2,"score":0.34470000863075256},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.33160001039505005},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.32919999957084656},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.32690000534057617},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.3240000009536743},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.31380000710487366},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2912999987602234},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2858999967575073},{"id":"https://openalex.org/C141268832","wikidata":"https://www.wikidata.org/wiki/Q2940499","display_name":"Depth map","level":3,"score":0.2809000015258789},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.27950000762939453},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.2524000108242035}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.05855","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.05855","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.05855","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.05855","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Reliable":[0],"terrain":[1],"perception":[2],"is":[3,45],"a":[4,30,48,59,79,114],"critical":[5],"prerequisite":[6],"for":[7,53,65],"the":[8,111],"deployment":[9],"of":[10,113],"humanoid":[11],"robots":[12],"in":[13],"unstructured,":[14],"human-centric":[15],"environments.":[16],"While":[17],"traditional":[18],"systems":[19],"often":[20],"rely":[21],"on":[22],"manually":[23],"engineered,":[24],"single-sensor":[25],"pipelines,":[26],"this":[27],"paper":[28],"presents":[29],"learning-based":[31],"framework":[32],"that":[33,95],"uses":[34],"an":[35,74,89],"intermediate,":[36],"robot-centric":[37],"heightmap":[38],"representation.":[39],"A":[40],"hybrid":[41],"Encoder-Decoder":[42],"Structure":[43],"(EDS)":[44],"introduced,":[46],"utilizing":[47],"Convolutional":[49],"Neural":[50],"Network":[51],"(CNN)":[52],"spatial":[54],"feature":[55],"extraction":[56],"fused":[57],"with":[58],"Gated":[60],"Recurrent":[61],"Unit":[62],"(GRU)":[63],"core":[64],"temporal":[66,117],"consistency.":[67],"The":[68],"architecture":[69],"integrates":[70],"multimodal":[71,96],"data":[72],"from":[73],"Intel":[75],"RealSense":[76],"depth":[77],"camera,":[78],"LIVOX":[80],"MID-360":[81],"LiDAR":[82],"processed":[83],"via":[84],"efficient":[85],"spherical":[86],"projection,":[87],"and":[88,105],"onboard":[90],"IMU.":[91],"Quantitative":[92],"results":[93],"demonstrate":[94],"fusion":[97],"improves":[98],"reconstruction":[99],"accuracy":[100],"by":[101],"7.2%":[102],"over":[103,107],"depth-only":[104],"9.9%":[106],"LiDAR-only":[108],"configurations.":[109],"Furthermore,":[110],"integration":[112],"3.2":[115],"s":[116],"context":[118],"reduces":[119],"mapping":[120],"drift.":[121]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-07T00:00:00"}
