{"id":"https://openalex.org/W6903351551","doi":"https://doi.org/10.1109/access.2025.3590646","title":"SN360: Semantic and Surface Normal Cascaded Multi-Task 360 Monocular Depth Estimation","display_name":"SN360: Semantic and Surface Normal Cascaded Multi-Task 360 Monocular Depth Estimation","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W6903351551","doi":"https://doi.org/10.1109/access.2025.3590646"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3590646","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3590646","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3590646","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Payal Mohadikar","orcid":"https://orcid.org/0009-0005-2616-7612"},"institutions":[{"id":"https://openalex.org/I76835614","display_name":"University of Missouri","ror":"https://ror.org/02ymw8z06","country_code":"US","type":"education","lineage":["https://openalex.org/I76835614"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Payal Mohadikar","raw_affiliation_strings":["Electrical Engineering and Computer Science, University of Missouri, Columbia, MO, USA"],"raw_orcid":"https://orcid.org/0009-0005-2616-7612","affiliations":[{"raw_affiliation_string":"Electrical Engineering and Computer Science, University of Missouri, Columbia, MO, USA","institution_ids":["https://openalex.org/I76835614"]}]},{"author_position":"last","author":{"id":null,"display_name":"Ye Duan","orcid":null},"institutions":[{"id":"https://openalex.org/I8078737","display_name":"Clemson University","ror":"https://ror.org/037s24f05","country_code":"US","type":"education","lineage":["https://openalex.org/I8078737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ye Duan","raw_affiliation_strings":["School of Computing, Clemson University, Clemson, SC, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computing, Clemson University, Clemson, SC, USA","institution_ids":["https://openalex.org/I8078737"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I76835614"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":1.0875,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.84407356,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"13","issue":null,"first_page":"127599","last_page":"127613"},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9642000198364258,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9642000198364258,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.006899999920278788,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.0034000000450760126,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.6434999704360962},{"id":"https://openalex.org/keywords/panorama","display_name":"Panorama","score":0.5989000201225281},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5273000001907349},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.4788999855518341},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4546000063419342},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.448199987411499},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4323999881744385},{"id":"https://openalex.org/keywords/surface","display_name":"Surface (topology)","score":0.4255000054836273},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.4180999994277954},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.36809998750686646}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7961000204086304},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6743999719619751},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.6434999704360962},{"id":"https://openalex.org/C2780580889","wikidata":"https://www.wikidata.org/wiki/Q41363","display_name":"Panorama","level":2,"score":0.5989000201225281},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5968999862670898},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5273000001907349},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.4788999855518341},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4546000063419342},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.448199987411499},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4323999881744385},{"id":"https://openalex.org/C2776799497","wikidata":"https://www.wikidata.org/wiki/Q484298","display_name":"Surface (topology)","level":2,"score":0.4255000054836273},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.4180999994277954},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.36809998750686646},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3619000017642975},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.35600000619888306},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.34209999442100525},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33000001311302185},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3246000111103058},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.31779998540878296},{"id":"https://openalex.org/C118732077","wikidata":"https://www.wikidata.org/wiki/Q273176","display_name":"Normal","level":3,"score":0.3160000145435333},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3138999938964844},{"id":"https://openalex.org/C2779010991","wikidata":"https://www.wikidata.org/wiki/Q2720909","display_name":"Artifact (error)","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.30640000104904175},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.3034000098705292},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.2964000105857849},{"id":"https://openalex.org/C29081049","wikidata":"https://www.wikidata.org/wiki/Q1364242","display_name":"Image stitching","level":2,"score":0.29159998893737793},{"id":"https://openalex.org/C157157409","wikidata":"https://www.wikidata.org/wiki/Q909601","display_name":"Tangent space","level":2,"score":0.2906999886035919},{"id":"https://openalex.org/C24027999","wikidata":"https://www.wikidata.org/wiki/Q2176348","display_name":"Omnidirectional antenna","level":3,"score":0.2529999911785126},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.25189998745918274},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.251800000667572}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3590646","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3590646","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:73039af9f997404ab4c09977009fae85","is_oa":true,"landing_page_url":"https://doaj.org/article/73039af9f997404ab4c09977009fae85","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 127599-127613 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3590646","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3590646","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3969819623","display_name":null,"funder_award_id":"W911NF2120275","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"},{"id":"https://openalex.org/G6191752688","display_name":null,"funder_award_id":"CNS-2018850","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7457524330","display_name":null,"funder_award_id":"NIBIB-R01-EB02943","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320338295","display_name":"Army Research Laboratory","ror":"https://ror.org/011hc8f90"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W2074254947","https://openalex.org/W2104974755","https://openalex.org/W2117539524","https://openalex.org/W2125416623","https://openalex.org/W2194775991","https://openalex.org/W2787091153","https://openalex.org/W2796422723","https://openalex.org/W2895250390","https://openalex.org/W2895696451","https://openalex.org/W2954174912","https://openalex.org/W2962741876","https://openalex.org/W2963389277","https://openalex.org/W2963488291","https://openalex.org/W2963591054","https://openalex.org/W2964014680","https://openalex.org/W2964339842","https://openalex.org/W2969261403","https://openalex.org/W2999254410","https://openalex.org/W3020521460","https://openalex.org/W3034515714","https://openalex.org/W3034530552","https://openalex.org/W3034728336","https://openalex.org/W3090975042","https://openalex.org/W3092934936","https://openalex.org/W3126573238","https://openalex.org/W3128100213","https://openalex.org/W3175201472","https://openalex.org/W3215974962","https://openalex.org/W4226339983","https://openalex.org/W4292787284","https://openalex.org/W4294068640","https://openalex.org/W4312566889","https://openalex.org/W4313169545","https://openalex.org/W4313174897","https://openalex.org/W4383108211","https://openalex.org/W4385245566","https://openalex.org/W4386075497","https://openalex.org/W4402727901","https://openalex.org/W6631190155","https://openalex.org/W6726497184","https://openalex.org/W6733367512","https://openalex.org/W6744291033","https://openalex.org/W6753449277","https://openalex.org/W6757782795","https://openalex.org/W6759134542","https://openalex.org/W6769516661","https://openalex.org/W6853628691"],"related_works":[],"abstract_inverted_index":{"Omnidirectional":[0],"images":[1],"carry":[2],"comprehensive":[3],"scene":[4,21,30],"representation":[5],"and":[6,15,66,98,118,152,196,223,231],"are":[7],"widely":[8,34],"useful":[9],"for":[10,39,43],"applications":[11],"like":[12],"AR/VR,":[13],"robotics,":[14],"autonomous":[16],"driving":[17],"that":[18,129,160],"require":[19],"holistic":[20,91,137],"understanding.":[22],"Depth":[23],"estimation,":[24,199],"being":[25],"the":[26,46,88,102,114,162,191,208,237],"core":[27],"component":[28],"of":[29,90,193],"understanding,":[31],"has":[32],"been":[33],"researched,":[35],"achieving":[36],"significant":[37,215],"improvement":[38,216],"perspective":[40],"inputs.":[41],"However,":[42],"360":[44,105],"input,":[45],"methods":[47,74],"still":[48],"produce":[49,173],"low-quality,":[50],"globally":[51,243],"inconsistent":[52],"depths,":[53],"indicating":[54],"poor":[55],"generalization":[56],"ability":[57],"due":[58],"to":[59,81,95,112,135,172,185,189,205],"challenges":[60],"such":[61],"as":[62],"inherent":[63],"spherical":[64,83],"distortion":[65],"relatively":[67],"few":[68],"training":[69],"data.":[70],"Recent":[71],"state-of-the-art":[72],"(SOTA)":[73],"utilize":[75],"multiple":[76],"projected":[77],"distortionless":[78],"tangent":[79],"patches":[80],"mitigate":[82,113],"distortion,":[84],"but":[85],"they":[86],"lose":[87],"learning":[89],"contextual":[92],"information,":[93],"leading":[94],"global":[96,116,141],"discrepancies":[97],"merging":[99,119],"artifacts":[100],"in":[101,167,202,217],"final":[103,209],"merged-back":[104],"depths.":[106,176,246],"In":[107],"this":[108],"paper,":[109],"we":[110],"propose":[111],"existing":[115],"inconsistency":[117],"artifact":[120],"issue":[121],"via":[122,143],"a":[123,132,149],"new":[124],"initial":[125,182],"depth":[126,183,210],"estimation":[127,184],"network":[128],"directly":[130],"takes":[131],"panorama":[133],"image":[134],"learn":[136],"features":[138],"with":[139],"enhanced":[140],"awareness":[142],"latent":[144],"attention.":[145],"We":[146],"further":[147],"present":[148],"novel":[150],"semantic":[151,194],"surface":[153,197],"normal":[154,198],"cascaded":[155],"multi-task":[156,169],"model":[157],"agnostic":[158],"framework":[159],"mitigates":[161],"negative":[163],"transfer":[164],"effect":[165],"observed":[166],"current":[168],"360-depth":[170],"approaches,":[171],"fine-grained,":[174],"structure-detailed":[175],"Specifically,":[177],"our":[178],"approach":[179,213],"utilizes":[180],"an":[181],"simulate":[186],"RGBD":[187],"input":[188],"enhance":[190],"performance":[192],"segmentation":[195],"which":[200],"is,":[201],"turn,":[203],"leveraged":[204],"explicitly":[206],"guide":[207],"prediction.":[211],"Our":[212],"shows":[214],"Abs":[218],"Rel":[219],"by":[220,226],"19.62%,":[221],"21.45%,":[222],"zero-shot":[224],"depths":[225],"22.8%":[227],"using":[228],"real-world":[229],"Stanford2D3D":[230],"Matterport2D3D":[232],"benchmark":[233],"datasets,":[234],"respectively,":[235],"over":[236],"SOTA":[238],"while":[239],"producing":[240],"structurally":[241],"detailed":[242],"consistent":[244],"high-quality":[245]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
