{"id":"https://openalex.org/W4414165700","doi":"https://doi.org/10.1109/access.2025.3607672","title":"Semantic Object Navigation With Segmenting Decision Transformer","display_name":"Semantic Object Navigation With Segmenting Decision Transformer","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4414165700","doi":"https://doi.org/10.1109/access.2025.3607672"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3607672","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3607672","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3607672","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009170866","display_name":"Aleksei Staroverov","orcid":"https://orcid.org/0000-0002-4730-1543"},"institutions":[{"id":"https://openalex.org/I193710463","display_name":"Zhukovsky Air Force Engineering Academy","ror":"https://ror.org/00y1a8425","country_code":"RU","type":"education","lineage":["https://openalex.org/I193710463"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"Aleksei Staroverov","raw_affiliation_strings":["AIRI, Moscow, Russia","AIRI, 32 Kutuzovsky Ave, Moscow, Russia"],"raw_orcid":"https://orcid.org/0000-0002-4730-1543","affiliations":[{"raw_affiliation_string":"AIRI, Moscow, Russia","institution_ids":[]},{"raw_affiliation_string":"AIRI, 32 Kutuzovsky Ave, Moscow, Russia","institution_ids":["https://openalex.org/I193710463"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058209276","display_name":"Tatiana Zemskova","orcid":"https://orcid.org/0000-0003-4271-7336"},"institutions":[{"id":"https://openalex.org/I193710463","display_name":"Zhukovsky Air Force Engineering Academy","ror":"https://ror.org/00y1a8425","country_code":"RU","type":"education","lineage":["https://openalex.org/I193710463"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"Tatiana Zemskova","raw_affiliation_strings":["AIRI, Moscow, Russia","AIRI, 32 Kutuzovsky Ave, Moscow, Russia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AIRI, Moscow, Russia","institution_ids":[]},{"raw_affiliation_string":"AIRI, 32 Kutuzovsky Ave, Moscow, Russia","institution_ids":["https://openalex.org/I193710463"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025655729","display_name":"Dmitry Yudin","orcid":"https://orcid.org/0000-0002-1407-2633"},"institutions":[{"id":"https://openalex.org/I193710463","display_name":"Zhukovsky Air Force Engineering Academy","ror":"https://ror.org/00y1a8425","country_code":"RU","type":"education","lineage":["https://openalex.org/I193710463"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"Dmitry A. Yudin","raw_affiliation_strings":["AIRI, Moscow, Russia","AIRI, 32 Kutuzovsky Ave, Moscow, Russia"],"raw_orcid":"https://orcid.org/0000-0002-1407-2633","affiliations":[{"raw_affiliation_string":"AIRI, Moscow, Russia","institution_ids":[]},{"raw_affiliation_string":"AIRI, 32 Kutuzovsky Ave, Moscow, Russia","institution_ids":["https://openalex.org/I193710463"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080806360","display_name":"Aleksandr I. Panov","orcid":"https://orcid.org/0000-0002-9747-3837"},"institutions":[{"id":"https://openalex.org/I193710463","display_name":"Zhukovsky Air Force Engineering Academy","ror":"https://ror.org/00y1a8425","country_code":"RU","type":"education","lineage":["https://openalex.org/I193710463"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"Aleksandr I. Panov","raw_affiliation_strings":["AIRI, Moscow, Russia","AIRI, 32 Kutuzovsky Ave, Moscow, Russia"],"raw_orcid":"https://orcid.org/0000-0002-9747-3837","affiliations":[{"raw_affiliation_string":"AIRI, Moscow, Russia","institution_ids":[]},{"raw_affiliation_string":"AIRI, 32 Kutuzovsky Ave, Moscow, Russia","institution_ids":["https://openalex.org/I193710463"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I193710463"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.11117781,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"13","issue":null,"first_page":"162807","last_page":"162820"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9732000231742859,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9732000231742859,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.9291999936103821,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9229999780654907,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6992999911308289},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4424999952316284},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.413100004196167},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.3783000111579895},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.36649999022483826},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.3513000011444092},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.3402000069618225},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.2969000041484833}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8708999752998352},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6992999911308289},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6051999926567078},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4424999952316284},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44200000166893005},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.413100004196167},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.3783000111579895},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.36649999022483826},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.352400004863739},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3513000011444092},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.3402000069618225},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3138999938964844},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2969000041484833},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.2962999939918518},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2865000069141388},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.2858000099658966},{"id":"https://openalex.org/C125308379","wikidata":"https://www.wikidata.org/wiki/Q363057","display_name":"Market segmentation","level":2,"score":0.28369998931884766},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.28360000252723694},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.2667999863624573},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.2639000117778778},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.2581999897956848},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.25690001249313354},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2567000091075897}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3607672","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3607672","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:3beb8d2424dd4ab9b795ea7e85903ac9","is_oa":true,"landing_page_url":"https://doaj.org/article/3beb8d2424dd4ab9b795ea7e85903ac9","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 162807-162820 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3607672","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3607672","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Object":[0],"navigation":[1,26,59,83,183],"remains":[2],"a":[3,47,62,100,118,139,143],"fundamental":[4],"challenge":[5],"in":[6,124,191],"robotics,":[7],"particularly":[8],"when":[9],"agents":[10],"must":[11],"reach":[12],"targets":[13],"specified":[14],"by":[15,110,189],"semantic":[16,23,55,145,157],"categories.":[17],"While":[18],"existing":[19],"approaches":[20],"often":[21],"treat":[22],"understanding":[24],"and":[25,58,82,96,148],"as":[27],"separate":[28],"components,":[29],"we":[30],"demonstrate":[31,128],"that":[32,50,70,129,163],"their":[33],"tight":[34],"coupling":[35],"is":[36,69,203],"crucial":[37],"for":[38],"robust":[39],"performance.":[40],"We":[41],"present":[42],"SegDT":[43,130,185,202],"(Segmenting":[44],"Decision":[45],"Transformer),":[46],"novel":[48],"architecture":[49],"jointly":[51],"learns":[52],"to":[53,195],"predict":[54],"segmentation":[56,80,136,146,169],"masks":[57],"actions":[60],"through":[61,114],"unified":[63],"transformer-based":[64,91],"model.":[65],"Our":[66,159],"key":[67],"insight":[68],"temporal":[71,165],"information":[72],"from":[73,117],"sequential":[74],"observations":[75],"can":[76],"simultaneously":[77],"enhance":[78],"both":[79],"quality":[81],"decisions.":[84],"To":[85],"address":[86],"the":[87,125,150,172,196],"inherent":[88],"challenges":[89],"of":[90,152,175,201],"navigation\u2014notably":[92],"poor":[93],"sample":[94],"efficiency":[95,193],"computational":[97],"complexity\u2014we":[98],"introduce":[99],"two-phase":[101],"training":[102],"approach:":[103],"offline":[104],"pretraining":[105],"on":[106],"expert":[107],"demonstrations":[108],"followed":[109],"online":[111],"policy":[112],"refinement":[113],"knowledge":[115],"transfer":[116],"recurrent":[119],"neural":[120],"network.":[121],"Extensive":[122],"experiments":[123],"Habitat":[126],"simulator":[127],"achieves":[131],"higher":[132],"results":[133],"using":[134,154],"predicted":[135],"masks,":[137],"outperforming":[138],"single-frame":[140],"baseline":[141],"with":[142],"pre-trained":[144],"model":[147],"approaching":[149],"performance":[151,188],"systems":[153],"ground":[155],"truth":[156],"information.":[158],"ablation":[160],"studies":[161],"reveal":[162],"SegDT\u2019s":[164],"processing":[166],"also":[167],"improves":[168],"quality,":[170],"highlighting":[171],"synergistic":[173],"benefits":[174],"joint":[176],"optimization.":[177],"When":[178],"integrated":[179],"into":[180],"complete":[181],"object":[182],"systems,":[184],"enhances":[186],"overall":[187],"9.6%":[190],"path":[192],"compared":[194],"state-of-the-art":[197],"method.":[198],"The":[199],"code":[200],"made":[204],"publicly":[205],"available":[206],"at":[207],"<uri":[208],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[209],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://github.com/CognitiveAISystems/SegDT</uri>":[210]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
