{"id":"https://openalex.org/W4413945067","doi":"https://doi.org/10.1109/icra55743.2025.11127739","title":"Cage: Causal Attention Enables Data-Efficient Generalizable Robotic Manipulation","display_name":"Cage: Causal Attention Enables Data-Efficient Generalizable Robotic Manipulation","publication_year":2025,"publication_date":"2025-05-19","ids":{"openalex":"https://openalex.org/W4413945067","doi":"https://doi.org/10.1109/icra55743.2025.11127739"},"language":"en","primary_location":{"id":"doi:10.1109/icra55743.2025.11127739","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11127739","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076676248","display_name":"Shangning Xia","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shangning Xia","raw_affiliation_strings":["Shanghai Jiao Tong University,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045458030","display_name":"Hongjie Fang","orcid":"https://orcid.org/0000-0002-6309-1160"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongjie Fang","raw_affiliation_strings":["Shanghai Jiao Tong University,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010726528","display_name":"Cewu Lu","orcid":"https://orcid.org/0009-0003-7254-9318"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cewu Lu","raw_affiliation_strings":["Shanghai Jiao Tong University,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077175165","display_name":"Haoshu Fang","orcid":"https://orcid.org/0000-0003-3108-6305"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao-Shu Fang","raw_affiliation_strings":["Shanghai Jiao Tong University,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5076676248"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":5.5813,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.95967694,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"13242","last_page":"13249"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12002","display_name":"Computability, Logic, AI Algorithms","score":0.9620000123977661,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9574000239372253,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6796890497207642},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4549545347690582},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4521614611148834}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6796890497207642},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4549545347690582},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4521614611148834}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra55743.2025.11127739","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11127739","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1817111062","display_name":null,"funder_award_id":"2022ZD0160102","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W2194775991","https://openalex.org/W2625366777","https://openalex.org/W2760103357","https://openalex.org/W3034891989","https://openalex.org/W3145450063","https://openalex.org/W3159481202","https://openalex.org/W3205786327","https://openalex.org/W3207758636","https://openalex.org/W3214952050","https://openalex.org/W4312933868","https://openalex.org/W4313156423","https://openalex.org/W4382366145","https://openalex.org/W4385245566","https://openalex.org/W4385403811","https://openalex.org/W4385430674","https://openalex.org/W4385430679","https://openalex.org/W4390872441","https://openalex.org/W4390874575","https://openalex.org/W4401415042","https://openalex.org/W4401415650","https://openalex.org/W4401416041","https://openalex.org/W4401417423","https://openalex.org/W4402353986","https://openalex.org/W4402354045","https://openalex.org/W4402354047","https://openalex.org/W4402354112","https://openalex.org/W4402354127","https://openalex.org/W4405785353"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Generalization":[0],"in":[1,105,121,141,149,167,179],"robotic":[2,23],"manipulation":[3,24,123],"remains":[4],"a":[5,21,67,75,93,156,162,170],"critical":[6],"challenge,":[7],"particularly":[8],"when":[9],"scaling":[10],"to":[11,27,81,154],"new":[12],"environments":[13],"with":[14,38,56,79],"limited":[15],"demonstrations.":[16],"This":[17],"paper":[18],"introduces":[19],"CAGE,":[20],"novel":[22],"policy":[25,64],"designed":[26],"overcome":[28],"these":[29],"generalization":[30,100],"barriers":[31],"by":[32],"integrating":[33],"the":[34,44,50,174],"pretrained":[35],"visual":[36,103],"representation":[37],"causal":[39,68],"attention":[40,80],"mechanism.":[41],"CAGE":[42,97,114,133,152],"utilizes":[43],"powerful":[45],"feature":[46],"extraction":[47],"capabilities":[48],"of":[49,137,177],"vision":[51],"foundation":[52],"model":[53],"DINOv2,":[54],"combined":[55],"LoRA":[57],"fine-tuning":[58],"for":[59,70],"robust":[60,99],"environment":[61],"understanding.":[62],"The":[63],"further":[65],"employs":[66],"perceiver":[69],"effective":[71],"token":[72],"compression":[73],"and":[74,108,161],"diffusion-based":[76],"action":[77],"head":[78],"enhance":[82],"task-specific":[83],"fine-grained":[84],"conditioning.":[85],"With":[86],"as":[87,89],"few":[88],"50":[90],"demonstrations":[91],"from":[92],"single":[94],"training":[95],"environment,":[96],"achieves":[98],"across":[101],"diverse":[102],"changes":[104],"objects,":[106],"backgrounds,":[107],"viewpoints.":[109],"Extensive":[110],"experiments":[111],"validate":[112],"that":[113],"significantly":[115],"outperforms":[116],"existing":[117],"state-of-the-art":[118],"RGB/RGB-D-based":[119],"approaches":[120],"various":[122],"tasks,":[124],"especially":[125],"under":[126],"large":[127],"distribution":[128],"shifts.":[129],"In":[130],"similar":[131],"environments,":[132,151],"offers":[134],"an":[135],"average":[136],"42":[138],"%":[139,158,164],"increase":[140],"task":[142],"completion":[143,159],"rate.":[144],"While":[145],"all":[146],"baselines":[147],"fail":[148],"unseen":[150],"manages":[153],"obtain":[155],"43":[157],"rate":[160,166],"51":[163],"success":[165],"average,":[168],"marking":[169],"substantial":[171],"advancement":[172],"toward":[173],"practical":[175],"deployment":[176],"robots":[178],"real-world":[180],"settings.":[181],"Project":[182],"website:":[183],"cage-policy.github.io.":[184]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-01T08:55:55.761014","created_date":"2025-10-10T00:00:00"}
