{"id":"https://openalex.org/W4406603720","doi":"https://doi.org/10.48550/arxiv.2501.09783","title":"GeoManip: Geometric Constraints as General Interfaces for Robot Manipulation","display_name":"GeoManip: Geometric Constraints as General Interfaces for Robot Manipulation","publication_year":2025,"publication_date":"2025-01-16","ids":{"openalex":"https://openalex.org/W4406603720","doi":"https://doi.org/10.48550/arxiv.2501.09783"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2501.09783","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.09783","pdf_url":"https://arxiv.org/pdf/2501.09783","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2501.09783","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034309002","display_name":"Weiliang Tang","orcid":"https://orcid.org/0009-0007-5794-858X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Tang, Weiliang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023225646","display_name":"Jiahui Pan","orcid":"https://orcid.org/0000-0002-7576-6743"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Jia-Hui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100707660","display_name":"Yunhui Liu","orcid":"https://orcid.org/0000-0002-3625-6679"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yun-Hui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064077634","display_name":"Masayoshi Tomizuka","orcid":"https://orcid.org/0000-0003-0206-6639"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tomizuka, Masayoshi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053710007","display_name":"Li Erran Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Li Erran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054382056","display_name":"Chi\u2010Wing Fu","orcid":"https://orcid.org/0000-0002-5238-593X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fu, Chi-Wing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5022382771","display_name":"Mingyu Ding","orcid":"https://orcid.org/0000-0001-6556-8359"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ding, Mingyu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5034309002"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11159","display_name":"Manufacturing Process and Optimization","score":0.8934999704360962,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11159","display_name":"Manufacturing Process and Optimization","score":0.8934999704360962,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6160456538200378},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.573750913143158},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.48709845542907715},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2634328305721283}],"concepts":[{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6160456538200378},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.573750913143158},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.48709845542907715},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2634328305721283}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2501.09783","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.09783","pdf_url":"https://arxiv.org/pdf/2501.09783","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2501.09783","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2501.09783","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2501.09783","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.09783","pdf_url":"https://arxiv.org/pdf/2501.09783","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322942","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48"},{"id":"https://openalex.org/F4320329815","display_name":"Hong Kong Government","ror":"https://ror.org/034179816"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4406603720.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"We":[0],"present":[1],"GeoManip,":[2],"a":[3,33,97,107],"framework":[4],"to":[5,9,32,44,123],"enable":[6],"generalist":[7],"robots":[8],"leverage":[10],"essential":[11],"conditions":[12],"derived":[13],"from":[14,127,148,152],"object":[15,112],"and":[16,56,69,81,106,130,137,158,170],"part":[17],"relationships,":[18],"as":[19],"geometric":[20,34,104],"constraints,":[21],"for":[22,162],"robot":[23],"manipulation.":[24],"For":[25],"example,":[26],"cutting":[27],"the":[28,36,39,45,64,131],"carrot":[29],"requires":[30],"adhering":[31],"constraint:":[35],"blade":[37],"of":[38],"knife":[40],"should":[41],"be":[42],"perpendicular":[43],"carrot's":[46],"direction.":[47],"By":[48],"interpreting":[49],"these":[50,116],"constraints":[51,105,126],"through":[52],"symbolic":[53],"language":[54,68],"representations":[55],"translating":[57],"them":[58],"into":[59],"low-level":[60],"actions,":[61],"GeoManip":[62,134],"bridges":[63],"gap":[65],"between":[66],"natural":[67],"robotic":[70],"execution,":[71],"enabling":[72],"greater":[73],"generalizability":[74],"across":[75],"diverse":[76],"even":[77],"unseen":[78],"tasks,":[79],"objects,":[80],"scenarios.":[82],"Unlike":[83],"vision-language-action":[84],"models":[85],"that":[86,101,110],"require":[87],"extensive":[88],"training,":[89],"operates":[90],"training-free":[91],"by":[92],"utilizing":[93],"large":[94],"foundational":[95],"models:":[96],"constraint":[98],"generation":[99],"module":[100],"predicts":[102],"stage-specific":[103],"geometry":[108],"parser":[109],"identifies":[111],"parts":[113],"involved":[114],"in":[115],"constraints.":[117],"A":[118],"solver":[119],"then":[120],"optimizes":[121],"trajectories":[122],"satisfy":[124],"inferred":[125],"task":[128],"descriptions":[129],"scene.":[132],"Furthermore,":[133],"learns":[135],"in-context":[136],"provides":[138],"five":[139],"appealing":[140],"human-robot":[141],"interaction":[142],"features:":[143],"on-the-fly":[144],"policy":[145],"adaptation,":[146],"learning":[147,151],"human":[149],"demonstrations,":[150],"failure":[153],"cases,":[154],"long-horizon":[155],"action":[156],"planning,":[157],"efficient":[159],"data":[160],"collection":[161],"imitation":[163],"learning.":[164],"Extensive":[165],"evaluations":[166],"on":[167],"both":[168],"simulations":[169],"real-world":[171],"scenarios":[172],"demonstrate":[173],"GeoManip's":[174],"state-of-the-art":[175],"performance,":[176],"with":[177],"superior":[178],"out-of-distribution":[179],"generalization":[180],"while":[181],"avoiding":[182],"costly":[183],"model":[184],"training.":[185]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
