{"id":"https://openalex.org/W3004133887","doi":"https://doi.org/10.1109/iros40897.2019.8967761","title":"Continuous Relaxation of Symbolic Planner for One-Shot Imitation Learning","display_name":"Continuous Relaxation of Symbolic Planner for One-Shot Imitation Learning","publication_year":2019,"publication_date":"2019-11-01","ids":{"openalex":"https://openalex.org/W3004133887","doi":"https://doi.org/10.1109/iros40897.2019.8967761","mag":"3004133887"},"language":"en","primary_location":{"id":"doi:10.1109/iros40897.2019.8967761","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros40897.2019.8967761","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052829033","display_name":"De-An Huang","orcid":"https://orcid.org/0000-0002-6945-7768"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"De-An Huang","raw_affiliation_strings":["Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028834865","display_name":"Danfei Xu","orcid":"https://orcid.org/0000-0002-8744-3861"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Danfei Xu","raw_affiliation_strings":["Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030826237","display_name":"Yuke Zhu","orcid":"https://orcid.org/0000-0002-9198-2227"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yuke Zhu","raw_affiliation_strings":["Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061193324","display_name":"Animesh Garg","orcid":"https://orcid.org/0000-0003-0482-4296"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Animesh Garg","raw_affiliation_strings":["Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042646536","display_name":"Silvio Savarese","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Silvio Savarese","raw_affiliation_strings":["Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100450462","display_name":"Li Fei-Fei","orcid":"https://orcid.org/0000-0002-7481-0810"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Li Fei-Fei","raw_affiliation_strings":["Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018518655","display_name":"Juan Carlos Niebles","orcid":"https://orcid.org/0000-0001-8225-9793"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Juan Carlos Niebles","raw_affiliation_strings":["Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department, Stanford University, 353 Serra Mall, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5052829033"],"corresponding_institution_ids":["https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":1.6195,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.87527953,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"2635","last_page":"2642"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9876999855041504,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.776202917098999},{"id":"https://openalex.org/keywords/planner","display_name":"Planner","score":0.7398506999015808},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.6651073098182678},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.625940203666687},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6152413487434387},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6040390133857727},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5817405581474304},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5281336903572083},{"id":"https://openalex.org/keywords/symbol","display_name":"Symbol (formal)","score":0.47274813055992126},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.45124930143356323},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4479571580886841},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.34714406728744507},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.09779015183448792},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09596079587936401},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08355700969696045}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.776202917098999},{"id":"https://openalex.org/C2776999362","wikidata":"https://www.wikidata.org/wiki/Q2349274","display_name":"Planner","level":2,"score":0.7398506999015808},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.6651073098182678},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.625940203666687},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6152413487434387},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6040390133857727},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5817405581474304},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5281336903572083},{"id":"https://openalex.org/C134400042","wikidata":"https://www.wikidata.org/wiki/Q2372244","display_name":"Symbol (formal)","level":2,"score":0.47274813055992126},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.45124930143356323},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4479571580886841},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.34714406728744507},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.09779015183448792},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09596079587936401},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08355700969696045},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros40897.2019.8967761","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros40897.2019.8967761","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6399999856948853,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W127341816","https://openalex.org/W1515891729","https://openalex.org/W1594698162","https://openalex.org/W1977970897","https://openalex.org/W2063471043","https://openalex.org/W2081476395","https://openalex.org/W2111027756","https://openalex.org/W2116039916","https://openalex.org/W2128459535","https://openalex.org/W2138501114","https://openalex.org/W2144913588","https://openalex.org/W2152232000","https://openalex.org/W2168359464","https://openalex.org/W2222874733","https://openalex.org/W2243242557","https://openalex.org/W2402990501","https://openalex.org/W2601322194","https://openalex.org/W2604763608","https://openalex.org/W2755546070","https://openalex.org/W2785948534","https://openalex.org/W2793380548","https://openalex.org/W2908470496","https://openalex.org/W2962732055","https://openalex.org/W2963094133","https://openalex.org/W2963341924","https://openalex.org/W2963703448","https://openalex.org/W2964021598","https://openalex.org/W2964055695","https://openalex.org/W2964118342","https://openalex.org/W2968227116","https://openalex.org/W2979490629","https://openalex.org/W3144080979","https://openalex.org/W6605199526","https://openalex.org/W6678993419","https://openalex.org/W6688576433","https://openalex.org/W6690608649","https://openalex.org/W6713200026","https://openalex.org/W6717697761","https://openalex.org/W6735944222","https://openalex.org/W6736057607","https://openalex.org/W6747769025","https://openalex.org/W6749986616","https://openalex.org/W6754777436"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2935909890","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W1531601525","https://openalex.org/W2047027848"],"abstract_inverted_index":{"We":[0,108],"address":[1,109],"one-shot":[2,54,160],"imitation":[3,55,161],"learning,":[4],"where":[5],"the":[6,31,43,46,64,71,75,90,118,126,130,138,143,147,155,159],"goal":[7],"is":[8,51,88,93],"to":[9,52,80,95,103],"execute":[10],"a":[11,17,35,58,114],"previously":[12],"unseen":[13],"task":[14],"based":[15],"on":[16,125],"single":[18],"demonstration.":[19],"While":[20],"there":[21],"has":[22],"been":[23],"exciting":[24],"progress":[25],"in":[26,146],"this":[27,110],"direction,":[28],"most":[29],"of":[30,45,117,129,137],"approaches":[32],"still":[33,141],"require":[34],"few":[36],"hundred":[37],"tasks":[38,163],"for":[39,158],"meta-training,":[40],"which":[41],"limits":[42],"scalability":[44],"approaches.":[47],"Our":[48,134],"main":[49],"contribution":[50],"formulate":[53],"learning":[56,162],"as":[57],"symbolic":[59,105,120],"planning":[60,106],"problem":[61],"along":[62],"with":[63,97],"symbol":[65,91,131,149],"grounding":[66,92,132,150],"problem.":[67],"This":[68],"formulation":[69],"disentangles":[70],"policy":[72],"execution":[73],"from":[74],"inter-task":[76],"generalization":[77],"and":[78,101,151],"leads":[79,102],"better":[81],"data":[82,100],"efficiency.":[83],"The":[84],"key":[85],"technical":[86],"challenge":[87,111],"that":[89,122],"prone":[94],"error":[96],"limited":[98],"training":[99,167],"subsequent":[104],"failures.":[107],"by":[112],"proposing":[113],"continuous":[115,135],"relaxation":[116,136],"discrete":[119],"planner":[121,139,157],"directly":[123],"plans":[124],"probabilistic":[127,148],"outputs":[128],"model.":[133],"can":[140],"leverage":[142],"information":[144],"contained":[145],"significantly":[152],"improve":[153],"over":[154],"baseline":[156],"without":[164],"using":[165],"large":[166],"data.":[168]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
