{"id":"https://openalex.org/W4306295016","doi":"https://doi.org/10.48550/arxiv.2210.06601","title":"Generalization with Lossy Affordances: Leveraging Broad Offline Data for Learning Visuomotor Tasks","display_name":"Generalization with Lossy Affordances: Leveraging Broad Offline Data for Learning Visuomotor Tasks","publication_year":2022,"publication_date":"2022-10-12","ids":{"openalex":"https://openalex.org/W4306295016","doi":"https://doi.org/10.48550/arxiv.2210.06601"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2210.06601","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2210.06601","pdf_url":"https://arxiv.org/pdf/2210.06601","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2210.06601","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113787478","display_name":"Kuan Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Fang, Kuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030238910","display_name":"Patrick Yin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yin, Patrick","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021472921","display_name":"Ashvin Nair","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nair, Ashvin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064208112","display_name":"Homer Walke","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Walke, Homer","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051491635","display_name":"Gengchen Yan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Gengchen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5026322200","display_name":"Sergey Levine","orcid":"https://orcid.org/0000-0001-6764-2743"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Levine, Sergey","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5113787478"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9894000291824341,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9865999817848206,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/affordance","display_name":"Affordance","score":0.8450874090194702},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7862240076065063},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7368239164352417},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.7217769026756287},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.7065741419792175},{"id":"https://openalex.org/keywords/lossy-compression","display_name":"Lossy compression","score":0.6917957067489624},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5923455953598022},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5785230398178101},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5173420310020447},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.46960529685020447},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.46141016483306885},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.45833662152290344}],"concepts":[{"id":"https://openalex.org/C194995250","wikidata":"https://www.wikidata.org/wiki/Q531136","display_name":"Affordance","level":2,"score":0.8450874090194702},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7862240076065063},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7368239164352417},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.7217769026756287},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.7065741419792175},{"id":"https://openalex.org/C165021410","wikidata":"https://www.wikidata.org/wiki/Q55564","display_name":"Lossy compression","level":2,"score":0.6917957067489624},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5923455953598022},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5785230398178101},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5173420310020447},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.46960529685020447},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.46141016483306885},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45833662152290344},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2210.06601","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2210.06601","pdf_url":"https://arxiv.org/pdf/2210.06601","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2210.06601","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2210.06601","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2210.06601","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2210.06601","pdf_url":"https://arxiv.org/pdf/2210.06601","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W1972718289","https://openalex.org/W1791514435","https://openalex.org/W2346831895","https://openalex.org/W2248634132","https://openalex.org/W3049116993","https://openalex.org/W1541884709","https://openalex.org/W2589081601","https://openalex.org/W2226037301","https://openalex.org/W2026855223","https://openalex.org/W2070708245"],"abstract_inverted_index":{"The":[0],"utilization":[1],"of":[2,16,24,93,161],"broad":[3,61,109],"datasets":[4,160],"has":[5],"proven":[6],"to":[7,20,89,141],"be":[8,156],"crucial":[9],"for":[10,12,28,51,134,170],"generalization":[11],"a":[13,34,45,79,91,138],"wide":[14],"range":[15],"fields.":[17],"However,":[18],"how":[19],"effectively":[21],"make":[22],"use":[23],"diverse":[25],"multi-task":[26],"data":[27],"novel":[29,80,171],"downstream":[30],"tasks":[31,55],"still":[32],"remains":[33],"grand":[35],"challenge":[36],"in":[37,63,71],"robotics.":[38],"To":[39],"tackle":[40],"this":[41],"challenge,":[42],"we":[43],"introduce":[44],"framework":[46,84,154],"that":[47,98,126,152],"acquires":[48],"goal-conditioned":[49],"policies":[50],"unseen":[52,135],"temporally":[53],"extended":[54],"via":[56],"offline":[57],"reinforcement":[58],"learning":[59],"on":[60,158],"data,":[62,110],"combination":[64],"with":[65,78],"online":[66],"fine-tuning":[67],"guided":[68],"by":[69],"subgoals":[70,97],"learned":[72],"lossy":[73,94,112],"representation":[74,113],"space.":[75],"When":[76],"faced":[77],"task":[81,102],"goal,":[82],"the":[83,100,108,111,142],"uses":[85],"an":[86],"affordance":[87],"model":[88],"plan":[90],"sequence":[92],"representations":[95],"as":[96],"decomposes":[99],"original":[101],"into":[103],"easier":[104],"problems.":[105],"Learned":[106],"from":[107,164,174],"emphasizes":[114],"task-relevant":[115],"information":[116],"about":[117],"states":[118],"and":[119,144,167],"goals":[120],"while":[121],"abstracting":[122],"away":[123],"redundant":[124],"contexts":[125],"hinder":[127],"generalization.":[128],"It":[129],"thus":[130],"enables":[131],"subgoal":[132],"planning":[133],"tasks,":[136,172],"provides":[137],"compact":[139],"input":[140],"policy,":[143],"facilitates":[145],"reward":[146,180],"shaping":[147],"during":[148],"fine-tuning.":[149],"We":[150],"show":[151],"our":[153],"can":[155],"pre-trained":[157],"large-scale":[159],"robot":[162],"experiences":[163],"prior":[165],"work":[166],"efficiently":[168],"fine-tuned":[169],"entirely":[173],"visual":[175],"inputs":[176],"without":[177],"any":[178],"manual":[179],"engineering.":[181]},"counts_by_year":[],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2022-10-15T00:00:00"}
