{"id":"https://openalex.org/W4383108839","doi":"https://doi.org/10.1109/icra48891.2023.10160946","title":"Learning to View: Decision Transformers for Active Object Detection","display_name":"Learning to View: Decision Transformers for Active Object Detection","publication_year":2023,"publication_date":"2023-05-29","ids":{"openalex":"https://openalex.org/W4383108839","doi":"https://doi.org/10.1109/icra48891.2023.10160946"},"language":"en","primary_location":{"id":"doi:10.1109/icra48891.2023.10160946","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra48891.2023.10160946","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058280572","display_name":"Wenhao Ding","orcid":"https://orcid.org/0000-0003-3218-8792"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Wenhao Ding","raw_affiliation_strings":["Amazon Lab126,Sunnyvale,CA,USA,94098","Carnegie Mellon University, Pittsburgh, PA, USA"],"affiliations":[{"raw_affiliation_string":"Amazon Lab126,Sunnyvale,CA,USA,94098","institution_ids":[]},{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024265021","display_name":"Nathalie Majcherczyk","orcid":"https://orcid.org/0000-0001-6888-1826"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nathalie Majcherczyk","raw_affiliation_strings":["Amazon Lab126,Sunnyvale,CA,USA,94098"],"affiliations":[{"raw_affiliation_string":"Amazon Lab126,Sunnyvale,CA,USA,94098","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109620159","display_name":"Mohit Deshpande","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mohit Deshpande","raw_affiliation_strings":["Amazon Lab126,Sunnyvale,CA,USA,94098"],"affiliations":[{"raw_affiliation_string":"Amazon Lab126,Sunnyvale,CA,USA,94098","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101906245","display_name":"Xuewei Qi","orcid":"https://orcid.org/0000-0003-3890-135X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xuewei Qi","raw_affiliation_strings":["Amazon Lab126,Sunnyvale,CA,USA,94098"],"affiliations":[{"raw_affiliation_string":"Amazon Lab126,Sunnyvale,CA,USA,94098","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037644321","display_name":"Ding Zhao","orcid":"https://orcid.org/0000-0002-9400-8446"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ding Zhao","raw_affiliation_strings":["Carnegie Mellon University,Pittsburgh,PA,USA,15213"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,Pittsburgh,PA,USA,15213","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056472890","display_name":"Rajasimman Madhivanan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rajasimman Madhivanan","raw_affiliation_strings":["Amazon Lab126,Sunnyvale,CA,USA,94098"],"affiliations":[{"raw_affiliation_string":"Amazon Lab126,Sunnyvale,CA,USA,94098","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053890173","display_name":"Arnie Sen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Arnie Sen","raw_affiliation_strings":["Amazon Lab126,Sunnyvale,CA,USA,94098"],"affiliations":[{"raw_affiliation_string":"Amazon Lab126,Sunnyvale,CA,USA,94098","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5058280572"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":2.6185,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.91673143,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"7140","last_page":"7146"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9868999719619751,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8007938861846924},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.7314251661300659},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6876885890960693},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6130092144012451},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5934762954711914},{"id":"https://openalex.org/keywords/active-perception","display_name":"Active perception","score":0.5550695061683655},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5190116167068481},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.5079882740974426},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4971330463886261},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.47975409030914307},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3277214765548706},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.144840270280838},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12903261184692383}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8007938861846924},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.7314251661300659},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6876885890960693},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6130092144012451},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5934762954711914},{"id":"https://openalex.org/C2776010242","wikidata":"https://www.wikidata.org/wiki/Q4677575","display_name":"Active perception","level":3,"score":0.5550695061683655},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5190116167068481},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.5079882740974426},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4971330463886261},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.47975409030914307},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3277214765548706},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.144840270280838},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12903261184692383},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra48891.2023.10160946","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra48891.2023.10160946","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.6000000238418579,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":59,"referenced_works":["https://openalex.org/W2108598243","https://openalex.org/W2119717200","https://openalex.org/W2593769898","https://openalex.org/W2736601468","https://openalex.org/W2807052771","https://openalex.org/W2899771611","https://openalex.org/W2904246096","https://openalex.org/W2907503094","https://openalex.org/W2919115771","https://openalex.org/W2962732398","https://openalex.org/W2966306124","https://openalex.org/W2981900248","https://openalex.org/W3009584650","https://openalex.org/W3016525976","https://openalex.org/W3022566517","https://openalex.org/W3030520226","https://openalex.org/W3033324992","https://openalex.org/W3046735138","https://openalex.org/W3130718496","https://openalex.org/W3143776122","https://openalex.org/W3163842339","https://openalex.org/W3169291081","https://openalex.org/W3205794883","https://openalex.org/W4207072548","https://openalex.org/W4221146510","https://openalex.org/W4226151089","https://openalex.org/W4226435594","https://openalex.org/W4281668117","https://openalex.org/W4286225098","https://openalex.org/W4286892762","https://openalex.org/W4287126489","https://openalex.org/W4287756699","https://openalex.org/W4293566037","https://openalex.org/W4298857966","https://openalex.org/W4312291425","https://openalex.org/W4360584316","https://openalex.org/W4385245566","https://openalex.org/W6637967152","https://openalex.org/W6739901393","https://openalex.org/W6741002519","https://openalex.org/W6747106673","https://openalex.org/W6757592117","https://openalex.org/W6774583691","https://openalex.org/W6776438516","https://openalex.org/W6776601253","https://openalex.org/W6778485988","https://openalex.org/W6779265984","https://openalex.org/W6779656125","https://openalex.org/W6792413472","https://openalex.org/W6796289742","https://openalex.org/W6802659552","https://openalex.org/W6802916882","https://openalex.org/W6804244202","https://openalex.org/W6804404469","https://openalex.org/W6810466897","https://openalex.org/W6810669889","https://openalex.org/W6810745647","https://openalex.org/W6839185451","https://openalex.org/W6841247348"],"related_works":["https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W4380318855","https://openalex.org/W2138720691","https://openalex.org/W2031695474","https://openalex.org/W2586732548","https://openalex.org/W3049728571","https://openalex.org/W20361778","https://openalex.org/W2024136090","https://openalex.org/W116417374"],"abstract_inverted_index":{"Active":[0],"perception":[1,12,34],"describes":[2],"a":[3,19,59,114,126],"broad":[4],"class":[5],"of":[6,38,84,147,182],"techniques":[7],"that":[8,80,105,163],"couple":[9],"planning":[10,68],"and":[11,73,130,172,186],"systems":[13],"to":[14,21,61,69,77,96,102],"move":[15,74],"the":[16,23,28,52,63,75,82,85,98,107,123,133,141,145,183],"robot":[17,24,76,99],"in":[18,100,140],"way":[20],"give":[22],"more":[25],"information":[26],"about":[27],"environment.":[29,142],"In":[30,87],"most":[31],"robotic":[32],"systems,":[33],"is":[35,46],"typically":[36],"independent":[37],"motion":[39],"planning.":[40],"For":[41],"example,":[42],"traditional":[43],"object":[44],"detection":[45,71,108],"passive:":[47],"it":[48,54],"operates":[49],"only":[50],"on":[51,150],"images":[53,104],"receives.":[55],"However,":[56],"we":[57,66,90,111],"have":[58],"chance":[60],"improve":[62],"results":[64,161],"if":[65],"allow":[67],"consume":[70],"signals":[72],"collect":[78],"views":[79],"maximize":[81,106],"quality":[83],"results.":[86],"this":[88],"paper,":[89],"use":[91],"reinforcement":[92],"learning":[93],"(RL)":[94],"methods":[95],"control":[97],"order":[101],"obtain":[103],"quality.":[109],"Specifically,":[110],"propose":[112],"using":[113],"Decision":[115],"Transformer":[116],"with":[117,125],"online":[118],"fine-tuning,":[119],"which":[120],"first":[121],"optimizes":[122],"policy":[124,135,171],"pre-collected":[127],"expert":[128,170],"dataset":[129,153],"then":[131],"improves":[132],"learned":[134],"by":[136],"exploring":[137],"better":[138],"solutions":[139],"We":[143,177],"evaluate":[144],"performance":[146],"proposed":[148],"method":[149,165],"an":[151,156],"interactive":[152],"collected":[154],"from":[155],"indoor":[157],"scenario":[158],"simulator.":[159],"Experimental":[160],"demonstrate":[162],"our":[164],"outperforms":[166],"all":[167],"baselines,":[168],"including":[169],"pure":[173],"offline":[174],"RL":[175],"methods.":[176],"also":[178],"provide":[179],"exhaustive":[180],"analyses":[181],"reward":[184],"distribution":[185],"observation":[187],"space.":[188]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":9}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
