{"id":"https://openalex.org/W4396819322","doi":"https://doi.org/10.1080/01691864.2024.2395926","title":"Open-set 3D semantic instance maps for vision language navigation \u2013 O3D-SIM","display_name":"Open-set 3D semantic instance maps for vision language navigation \u2013 O3D-SIM","publication_year":2024,"publication_date":"2024-08-29","ids":{"openalex":"https://openalex.org/W4396819322","doi":"https://doi.org/10.1080/01691864.2024.2395926"},"language":"en","primary_location":{"id":"doi:10.1080/01691864.2024.2395926","is_oa":false,"landing_page_url":"https://doi.org/10.1080/01691864.2024.2395926","pdf_url":null,"source":{"id":"https://openalex.org/S192584203","display_name":"Advanced Robotics","issn_l":"0169-1864","issn":["0169-1864","1568-5535"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advanced Robotics","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2404.17922","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092029436","display_name":"Laksh Nanwani","orcid":"https://orcid.org/0009-0008-6422-1749"},"institutions":[{"id":"https://openalex.org/I64189192","display_name":"International Institute of Information Technology, Hyderabad","ror":"https://ror.org/05f11g639","country_code":"IN","type":"education","lineage":["https://openalex.org/I64189192"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Laksh Nanwani","raw_affiliation_strings":["Robotics Research Center, International Institute of Information Technology, Hyderabad, India"],"raw_orcid":"https://orcid.org/0009-0008-6422-1749","affiliations":[{"raw_affiliation_string":"Robotics Research Center, International Institute of Information Technology, Hyderabad, India","institution_ids":["https://openalex.org/I64189192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102663272","display_name":"Kumaraditya Gupta","orcid":null},"institutions":[{"id":"https://openalex.org/I64189192","display_name":"International Institute of Information Technology, Hyderabad","ror":"https://ror.org/05f11g639","country_code":"IN","type":"education","lineage":["https://openalex.org/I64189192"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Kumaraditya Gupta","raw_affiliation_strings":["Robotics Research Center, International Institute of Information Technology, Hyderabad, India"],"raw_orcid":"https://orcid.org/0009-0007-4108-4342","affiliations":[{"raw_affiliation_string":"Robotics Research Center, International Institute of Information Technology, Hyderabad, India","institution_ids":["https://openalex.org/I64189192"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Aditya Mathur","orcid":"https://orcid.org/0009-0006-3007-8652"},"institutions":[{"id":"https://openalex.org/I64189192","display_name":"International Institute of Information Technology, Hyderabad","ror":"https://ror.org/05f11g639","country_code":"IN","type":"education","lineage":["https://openalex.org/I64189192"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Aditya Mathur","raw_affiliation_strings":["Robotics Research Center, International Institute of Information Technology, Hyderabad, India"],"raw_orcid":"https://orcid.org/0009-0006-3007-8652","affiliations":[{"raw_affiliation_string":"Robotics Research Center, International Institute of Information Technology, Hyderabad, India","institution_ids":["https://openalex.org/I64189192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101351930","display_name":"Swayam Agrawal","orcid":null},"institutions":[{"id":"https://openalex.org/I64189192","display_name":"International Institute of Information Technology, Hyderabad","ror":"https://ror.org/05f11g639","country_code":"IN","type":"education","lineage":["https://openalex.org/I64189192"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Swayam Agrawal","raw_affiliation_strings":["Robotics Research Center, International Institute of Information Technology, Hyderabad, India"],"raw_orcid":"https://orcid.org/0009-0001-6767-8612","affiliations":[{"raw_affiliation_string":"Robotics Research Center, International Institute of Information Technology, Hyderabad, India","institution_ids":["https://openalex.org/I64189192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014203520","display_name":"A. H. Abdul Hafez","orcid":"https://orcid.org/0000-0002-1908-5521"},"institutions":[{"id":"https://openalex.org/I4210154391","display_name":"Hasan Kalyoncu University","ror":"https://ror.org/054g2pw49","country_code":"TR","type":"education","lineage":["https://openalex.org/I4210154391"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"A. H. Abdul Hafez","raw_affiliation_strings":["Faculty of Engineering, Hasan Kalyoncu University, Gaziantep, Turkey"],"raw_orcid":"https://orcid.org/0000-0002-1908-5521","affiliations":[{"raw_affiliation_string":"Faculty of Engineering, Hasan Kalyoncu University, Gaziantep, Turkey","institution_ids":["https://openalex.org/I4210154391"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037843540","display_name":"K. Madhava Krishna","orcid":null},"institutions":[{"id":"https://openalex.org/I64189192","display_name":"International Institute of Information Technology, Hyderabad","ror":"https://ror.org/05f11g639","country_code":"IN","type":"education","lineage":["https://openalex.org/I64189192"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"K. Madhava Krishna","raw_affiliation_strings":["Robotics Research Center, International Institute of Information Technology, Hyderabad, India"],"raw_orcid":"https://orcid.org/0000-0001-7846-7901","affiliations":[{"raw_affiliation_string":"Robotics Research Center, International Institute of Information Technology, Hyderabad, India","institution_ids":["https://openalex.org/I64189192"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5092029436"],"corresponding_institution_ids":["https://openalex.org/I64189192"],"apc_list":null,"apc_paid":null,"fwci":0.4762,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.60788574,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"38","issue":"19-20","first_page":"1378","last_page":"1391"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9700000286102295,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9700000286102295,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.944100022315979,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9380999803543091,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6810677647590637},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5793464779853821},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5548704862594604},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.43611517548561096},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43268972635269165},{"id":"https://openalex.org/keywords/open-set","display_name":"Open set","score":0.4234585165977478},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.17550262808799744},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11049443483352661},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.05994617938995361}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6810677647590637},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5793464779853821},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5548704862594604},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.43611517548561096},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43268972635269165},{"id":"https://openalex.org/C42357961","wikidata":"https://www.wikidata.org/wiki/Q213363","display_name":"Open set","level":2,"score":0.4234585165977478},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.17550262808799744},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11049443483352661},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.05994617938995361}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1080/01691864.2024.2395926","is_oa":false,"landing_page_url":"https://doi.org/10.1080/01691864.2024.2395926","pdf_url":null,"source":{"id":"https://openalex.org/S192584203","display_name":"Advanced Robotics","issn_l":"0169-1864","issn":["0169-1864","1568-5535"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advanced Robotics","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2404.17922","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.17922","pdf_url":"https://arxiv.org/pdf/2404.17922","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:openaccess.hku.edu.tr:20.500.11782/4443","is_oa":true,"landing_page_url":"https://doi.org/10.1080/01691864.2024.2395926.","pdf_url":null,"source":{"id":"https://openalex.org/S4306401159","display_name":"Hasan Kalyoncu University Institutional Repository (Hasan Kalyoncu University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210154391","host_organization_name":"Hasan Kalyoncu University","host_organization_lineage":["https://openalex.org/I4210154391"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2404.17922","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.17922","pdf_url":"https://arxiv.org/pdf/2404.17922","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7200000286102295,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320332009","display_name":"International Institute of Information Technology, Hyderabad","ror":null}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4396819322.pdf"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W2153054365","https://openalex.org/W2963150697","https://openalex.org/W2963800628","https://openalex.org/W2964339842","https://openalex.org/W2999219213","https://openalex.org/W3009928773","https://openalex.org/W3034500398","https://openalex.org/W3172675210","https://openalex.org/W3205276578","https://openalex.org/W4200150166","https://openalex.org/W4210320874","https://openalex.org/W4220736817","https://openalex.org/W4236147647","https://openalex.org/W4252907012","https://openalex.org/W4285224875","https://openalex.org/W4312815172","https://openalex.org/W4312938887","https://openalex.org/W4327662982","https://openalex.org/W4366208220","https://openalex.org/W4383108296","https://openalex.org/W4383108807","https://openalex.org/W4383108895","https://openalex.org/W4383109211","https://openalex.org/W4385431115","https://openalex.org/W4386065347","https://openalex.org/W4386066594","https://openalex.org/W4388624206","https://openalex.org/W4390874575","https://openalex.org/W4399375990","https://openalex.org/W4401414715","https://openalex.org/W4402354030","https://openalex.org/W4402917081","https://openalex.org/W4404612908"],"related_works":["https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Humans":[0],"excel":[1],"at":[2],"forming":[3],"mental":[4],"maps":[5,36],"of":[6,66,142,191],"their":[7],"surroundings,":[8],"equipping":[9],"them":[10],"to":[11,81,154,169,180],"understand":[12],"object":[13,100],"relationships":[14],"and":[15,49,62,88,91,104,159,164,166],"navigate":[16],"based":[17],"on":[18,47],"language":[19,39,130,165],"queries.":[20],"Our":[21,94],"previous":[22],"work":[23,136],"SI":[24],"Maps":[25],"(Nanwani":[26],"L,":[27],"Agarwal":[28],"A,":[29],"Jain":[30],"K,":[31],"et":[32],"al.":[33],"Instance-level":[34],"semantic":[35,64,126],"for":[37,73,99],"vision":[38],"navigation.":[40],"In:":[41],"2023":[42,55],"32nd":[43],"IEEE":[44],"International":[45],"Conference":[46],"Robot":[48],"Human":[50],"Interactive":[51],"Communication":[52],"(RO-MAN).":[53],"IEEE;":[54],"Aug.)":[56],"showed":[57],"that":[58,111,128],"having":[59],"instance-level":[60,79,120],"information":[61],"the":[63,85,125,135,139,146,152,161],"understanding":[65,127],"an":[67],"environment":[68],"helps":[69],"significantly":[70],"improve":[71],"performance":[72],"language-guided":[74,143],"tasks.":[75,144],"We":[76,107],"extend":[77],"this":[78],"approach":[80,176],"3D":[82,115],"while":[83],"increasing":[84],"pipeline&apos;s":[86],"robustness":[87],"improving":[89],"quantitative":[90],"qualitative":[92],"results.":[93],"method":[95],"leverages":[96],"foundational":[97,162],"models":[98,163],"recognition,":[101],"image":[102],"segmentation,":[103],"feature":[105],"extraction.":[106],"propose":[108],"a":[109,114,174],"representation":[110],"results":[112],"in":[113,124],"point":[116],"cloud":[117],"map":[118],"with":[119],"embeddings,":[121],"which":[122],"bring":[123],"natural":[129],"commands":[131],"can":[132],"query.":[133],"Quantitatively,":[134],"improves":[137],"upon":[138],"success":[140],"rate":[141],"At":[145],"same":[147],"time,":[148],"we":[149],"qualitatively":[150],"observe":[151],"ability":[153],"identify":[155,170],"instances":[156],"more":[157],"clearly":[158],"leverage":[160],"image-aligned":[167],"embeddings":[168],"objects":[171],"that,":[172],"otherwise,":[173],"closed-set":[175],"wouldn&apos;t":[177],"be":[178],"able":[179],"identify.":[181],"Project":[182],"Page":[183],"-":[184],"https://smart-wheelchair-rrc.github.io/o3d-sim-webpage.":[185],"\u00a9":[186],"2024":[187],"The":[188],"Robotics":[189],"Society":[190],"Japan.":[192]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
