{"id":"https://openalex.org/W7133983534","doi":"https://doi.org/10.1007/s11370-026-00707-4","title":"Oracle-grasp: zero-shot affordance-aligned robotic grasping using large multimodal models","display_name":"Oracle-grasp: zero-shot affordance-aligned robotic grasping using large multimodal models","publication_year":2026,"publication_date":"2026-03-06","ids":{"openalex":"https://openalex.org/W7133983534","doi":"https://doi.org/10.1007/s11370-026-00707-4"},"language":"en","primary_location":{"id":"doi:10.1007/s11370-026-00707-4","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11370-026-00707-4","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11370-026-00707-4.pdf","source":{"id":"https://openalex.org/S145649206","display_name":"Intelligent Service Robotics","issn_l":"1861-2776","issn":["1861-2776","1861-2784"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Intelligent Service Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s11370-026-00707-4.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128250045","display_name":"Avihai Giuili","orcid":null},"institutions":[{"id":"https://openalex.org/I16391192","display_name":"Tel Aviv University","ror":"https://ror.org/04mhzgx49","country_code":"IL","type":"education","lineage":["https://openalex.org/I16391192"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Avihai Giuili","raw_affiliation_strings":["School of Mechanical Engineering, Tel-Aviv University, 55 Chaim Lebanon St., 6997801, Tel-Aviv, Israel"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, Tel-Aviv University, 55 Chaim Lebanon St., 6997801, Tel-Aviv, Israel","institution_ids":["https://openalex.org/I16391192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114658287","display_name":"Rotem Atari","orcid":null},"institutions":[{"id":"https://openalex.org/I16391192","display_name":"Tel Aviv University","ror":"https://ror.org/04mhzgx49","country_code":"IL","type":"education","lineage":["https://openalex.org/I16391192"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Rotem Atari","raw_affiliation_strings":["School of Mechanical Engineering, Tel-Aviv University, 55 Chaim Lebanon St., 6997801, Tel-Aviv, Israel"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, Tel-Aviv University, 55 Chaim Lebanon St., 6997801, Tel-Aviv, Israel","institution_ids":["https://openalex.org/I16391192"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030565378","display_name":"Avishai Sintov","orcid":"https://orcid.org/0000-0002-3320-3897"},"institutions":[{"id":"https://openalex.org/I16391192","display_name":"Tel Aviv University","ror":"https://ror.org/04mhzgx49","country_code":"IL","type":"education","lineage":["https://openalex.org/I16391192"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Avishai Sintov","raw_affiliation_strings":["School of Mechanical Engineering, Tel-Aviv University, 55 Chaim Lebanon St., 6997801, Tel-Aviv, Israel"],"raw_orcid":"https://orcid.org/0000-0002-3320-3897","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, Tel-Aviv University, 55 Chaim Lebanon St., 6997801, Tel-Aviv, Israel","institution_ids":["https://openalex.org/I16391192"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5030565378"],"corresponding_institution_ids":["https://openalex.org/I16391192"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.47356263,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"19","issue":"3","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.8984000086784363,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.8984000086784363,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.03240000084042549,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.02449999935925007,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/grasp","display_name":"GRASP","score":0.9140999913215637},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5867999792098999},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5224000215530396},{"id":"https://openalex.org/keywords/service","display_name":"Service (business)","score":0.44119998812675476},{"id":"https://openalex.org/keywords/semantic-mapping","display_name":"Semantic mapping","score":0.39100000262260437},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.38760000467300415},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.3601999878883362},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.35519999265670776}],"concepts":[{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.9140999913215637},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.885699987411499},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6212999820709229},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5867999792098999},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5224000215530396},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.46309998631477356},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.44119998812675476},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.39100000262260437},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.38760000467300415},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3601999878883362},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3553999960422516},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.35519999265670776},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.3522999882698059},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.3337000012397766},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.320499986410141},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.32010000944137573},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.2924000024795532},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.29100000858306885},{"id":"https://openalex.org/C64754055","wikidata":"https://www.wikidata.org/wiki/Q7574053","display_name":"Spatial contextual awareness","level":2,"score":0.2840999960899353},{"id":"https://openalex.org/C2776228582","wikidata":"https://www.wikidata.org/wiki/Q7455797","display_name":"Service robot","level":3,"score":0.28049999475479126},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.275299996137619},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2619999945163727},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.25690001249313354}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s11370-026-00707-4","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11370-026-00707-4","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11370-026-00707-4.pdf","source":{"id":"https://openalex.org/S145649206","display_name":"Intelligent Service Robotics","issn_l":"1861-2776","issn":["1861-2776","1861-2784"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Intelligent Service Robotics","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s11370-026-00707-4","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11370-026-00707-4","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11370-026-00707-4.pdf","source":{"id":"https://openalex.org/S145649206","display_name":"Intelligent Service Robotics","issn_l":"1861-2776","issn":["1861-2776","1861-2784"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Intelligent Service Robotics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.48371049761772156}],"awards":[{"id":"https://openalex.org/G5324360481","display_name":null,"funder_award_id":"451/24","funder_id":"https://openalex.org/F4320322252","funder_display_name":"Israel Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320322252","display_name":"Israel Science Foundation","ror":"https://ror.org/04sazxf24"},{"id":"https://openalex.org/F4320322596","display_name":"Tel Aviv University","ror":"https://ror.org/04mhzgx49"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7133983534.pdf","grobid_xml":"https://content.openalex.org/works/W7133983534.grobid-xml"},"referenced_works_count":30,"referenced_works":["https://openalex.org/W1542761027","https://openalex.org/W2005824379","https://openalex.org/W2010274050","https://openalex.org/W2036637075","https://openalex.org/W2041376653","https://openalex.org/W2236233024","https://openalex.org/W2600030077","https://openalex.org/W2910474428","https://openalex.org/W2962736495","https://openalex.org/W2962793652","https://openalex.org/W2963033241","https://openalex.org/W2966615203","https://openalex.org/W3004103739","https://openalex.org/W4313026212","https://openalex.org/W4383108457","https://openalex.org/W4386599745","https://openalex.org/W4387092545","https://openalex.org/W4389666604","https://openalex.org/W4392646028","https://openalex.org/W4401019071","https://openalex.org/W4401415530","https://openalex.org/W4402670135","https://openalex.org/W4402702930","https://openalex.org/W4405785344","https://openalex.org/W4405786716","https://openalex.org/W4405910844","https://openalex.org/W4407637743","https://openalex.org/W4408555470","https://openalex.org/W4416747768","https://openalex.org/W7133196460"],"related_works":[],"abstract_inverted_index":{"Abstract":[0],"Grasping":[1],"unknown":[2],"objects":[3,62],"in":[4,17,28,209,227],"unstructured":[5],"environments":[6,30],"is":[7],"a":[8,68,98,104,172],"critical":[9],"challenge":[10],"for":[11,220,234],"service":[12,229],"robots,":[13,230],"which":[14,50],"must":[15],"operate":[16],"dynamic,":[18],"real-world":[19,210],"settings":[20],"such":[21],"as":[22,77,97],"homes,":[23],"hospitals,":[24],"and":[25,35,55,140,147,160,177,183,195,223],"warehouses.":[26],"Success":[27],"these":[29],"requires":[31],"both":[32,181],"semantic":[33,78],"understanding":[34],"spatial":[36,129],"reasoning.":[37],"Traditional":[38],"methods":[39],"often":[40],"rely":[41],"on":[42,171],"dense":[43],"training":[44,88],"datasets":[45],"or":[46,63,89,237],"detailed":[47],"geometric":[48],"modeling,":[49],"demand":[51],"extensive":[52,238],"data":[53],"collection":[54],"do":[56],"not":[57],"generalize":[58],"well":[59],"to":[60,80,144],"novel":[61],"affordances.":[64],"We":[65,168],"present":[66],"ORACLE-Grasp,":[67],"zero-shot":[69],"framework":[70],"that":[71,189,199],"leverages":[72],"large":[73],"multimodal":[74],"models":[75,236],"(LMMs)":[76],"oracles":[79],"guide":[81],"affordance-aligned":[82],"grasp":[83,95,149,156],"selection,":[84],"without":[85],"requiring":[86],"task-specific":[87],"manual":[90],"input.":[91],"The":[92,186],"system":[93],"reformulates":[94],"prediction":[96],"structured,":[99],"iterative":[100],"decision":[101],"process,":[102],"using":[103],"dual-prompt":[105],"tool-calling":[106],"strategy:":[107],"the":[108,116,123,128,135,216,232],"first":[109],"prompt":[110],"extracts":[111],"high-level":[112],"object":[113],"semantics,":[114],"while":[115],"second":[117],"identifies":[118],"graspable":[119],"regions":[120,139],"aligned":[121],"with":[122,202],"object\u2019s":[124],"function.":[125],"To":[126],"address":[127],"limitations":[130],"of":[131,175,218],"LMMs,":[132],"ORACLE-Grasp":[133,170],"discretizes":[134],"image":[136],"into":[137],"candidate":[138],"reasons":[141],"over":[142],"them":[143],"produce":[145],"human-like":[146],"context-sensitive":[148],"suggestions.":[150],"A":[151],"depth-based":[152],"refinement":[153],"step":[154],"improves":[155],"reliability":[157],"when":[158],"available,":[159],"an":[161],"early":[162],"stopping":[163],"mechanism":[164],"enhances":[165],"computational":[166],"efficiency.":[167],"evaluate":[169],"diverse":[173],"set":[174],"RGB":[176],"RGB-D":[178],"images":[179],"featuring":[180],"everyday":[182],"AI-generated":[184],"objects.":[185],"results":[187],"show":[188],"our":[190],"method":[191],"produces":[192],"physically":[193],"feasible":[194],"semantically":[196],"appropriate":[197],"grasps":[198],"align":[200],"closely":[201],"human":[203],"annotations,":[204],"achieving":[205],"high":[206],"success":[207],"rates":[208],"pick-up":[211],"tasks.":[212],"Our":[213],"findings":[214],"highlight":[215],"potential":[217],"LMMs":[219],"enabling":[221],"flexible":[222],"generalizable":[224],"grasping":[225],"strategies":[226],"autonomous":[228],"eliminating":[231],"need":[233],"object-specific":[235],"training.":[239]},"counts_by_year":[],"updated_date":"2026-03-07T13:37:22.277990","created_date":"2026-02-19T00:00:00"}
