{"id":"https://openalex.org/W4413925281","doi":"https://doi.org/10.1109/icra55743.2025.11128679","title":"A Parameter-Efficient Tuning Framework for Language-Guided Object Grounding and Robot Grasping","display_name":"A Parameter-Efficient Tuning Framework for Language-Guided Object Grounding and Robot Grasping","publication_year":2025,"publication_date":"2025-05-19","ids":{"openalex":"https://openalex.org/W4413925281","doi":"https://doi.org/10.1109/icra55743.2025.11128679"},"language":"en","primary_location":{"id":"doi:10.1109/icra55743.2025.11128679","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11128679","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088122096","display_name":"Houjian Yu","orcid":"https://orcid.org/0000-0001-8869-5078"},"institutions":[{"id":"https://openalex.org/I130238516","display_name":"University of Minnesota","ror":"https://ror.org/017zqws13","country_code":"US","type":"education","lineage":["https://openalex.org/I130238516"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Houjian Yu","raw_affiliation_strings":["Univ. of Minnesota,Department of Electrical and Computer Engineering,Minneapolis,USA"],"affiliations":[{"raw_affiliation_string":"Univ. of Minnesota,Department of Electrical and Computer Engineering,Minneapolis,USA","institution_ids":["https://openalex.org/I130238516"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083948436","display_name":"Mingen Li","orcid":null},"institutions":[{"id":"https://openalex.org/I130238516","display_name":"University of Minnesota","ror":"https://ror.org/017zqws13","country_code":"US","type":"education","lineage":["https://openalex.org/I130238516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mingen Li","raw_affiliation_strings":["Univ. of Minnesota,Department of Electrical and Computer Engineering,Minneapolis,USA"],"affiliations":[{"raw_affiliation_string":"Univ. of Minnesota,Department of Electrical and Computer Engineering,Minneapolis,USA","institution_ids":["https://openalex.org/I130238516"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088480186","display_name":"Alireza Rezazadeh","orcid":"https://orcid.org/0000-0002-2457-9470"},"institutions":[{"id":"https://openalex.org/I130238516","display_name":"University of Minnesota","ror":"https://ror.org/017zqws13","country_code":"US","type":"education","lineage":["https://openalex.org/I130238516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alireza Rezazadeh","raw_affiliation_strings":["Univ. of Minnesota,Department of Electrical and Computer Engineering,Minneapolis,USA"],"affiliations":[{"raw_affiliation_string":"Univ. of Minnesota,Department of Electrical and Computer Engineering,Minneapolis,USA","institution_ids":["https://openalex.org/I130238516"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100397589","display_name":"Yang Yang","orcid":"https://orcid.org/0000-0002-4134-901X"},"institutions":[{"id":"https://openalex.org/I130238516","display_name":"University of Minnesota","ror":"https://ror.org/017zqws13","country_code":"US","type":"education","lineage":["https://openalex.org/I130238516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yang Yang","raw_affiliation_strings":["Univ. of Minnesota,Department of Computer Science and Engineering,Minneapolis,USA"],"affiliations":[{"raw_affiliation_string":"Univ. of Minnesota,Department of Computer Science and Engineering,Minneapolis,USA","institution_ids":["https://openalex.org/I130238516"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057994317","display_name":"Changhyun Choi","orcid":"https://orcid.org/0000-0003-4715-3576"},"institutions":[{"id":"https://openalex.org/I130238516","display_name":"University of Minnesota","ror":"https://ror.org/017zqws13","country_code":"US","type":"education","lineage":["https://openalex.org/I130238516"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Changhyun Choi","raw_affiliation_strings":["Univ. of Minnesota,Department of Electrical and Computer Engineering,Minneapolis,USA"],"affiliations":[{"raw_affiliation_string":"Univ. of Minnesota,Department of Electrical and Computer Engineering,Minneapolis,USA","institution_ids":["https://openalex.org/I130238516"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5088122096"],"corresponding_institution_ids":["https://openalex.org/I130238516"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.3513301,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"14353","last_page":"14360"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9879999756813049,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9793999791145325,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ground","display_name":"Ground","score":0.745036780834198},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7069278955459595},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.701298713684082},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6599288582801819},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.47424548864364624},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4581637978553772},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.19085636734962463},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.16221535205841064}],"concepts":[{"id":"https://openalex.org/C168993435","wikidata":"https://www.wikidata.org/wiki/Q6501125","display_name":"Ground","level":2,"score":0.745036780834198},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7069278955459595},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.701298713684082},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6599288582801819},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.47424548864364624},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4581637978553772},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.19085636734962463},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.16221535205841064}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra55743.2025.11128679","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11128679","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4595098722","display_name":null,"funder_award_id":"2143730","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1505952289","https://openalex.org/W2082511574","https://openalex.org/W2194775991","https://openalex.org/W2251512949","https://openalex.org/W2302548814","https://openalex.org/W2560647685","https://openalex.org/W2918333121","https://openalex.org/W2962875890","https://openalex.org/W2963109634","https://openalex.org/W2964284374","https://openalex.org/W2964345792","https://openalex.org/W3093025045","https://openalex.org/W3137905681","https://openalex.org/W3171007011","https://openalex.org/W3174770825","https://openalex.org/W3176770340","https://openalex.org/W3198377975","https://openalex.org/W3201770677","https://openalex.org/W3205613184","https://openalex.org/W3205684050","https://openalex.org/W3216551675","https://openalex.org/W4200631575","https://openalex.org/W4280533594","https://openalex.org/W4285102435","https://openalex.org/W4312543911","https://openalex.org/W4312615341","https://openalex.org/W4383108836","https://openalex.org/W4389665522","https://openalex.org/W4389666604","https://openalex.org/W4389667112","https://openalex.org/W4389667691","https://openalex.org/W4389667706","https://openalex.org/W4390830078","https://openalex.org/W4390871886","https://openalex.org/W4390873528","https://openalex.org/W4402702930","https://openalex.org/W4403488721","https://openalex.org/W4405078890","https://openalex.org/W4405786114"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"The":[0],"language-guided":[1,69],"robot":[2,7,120],"grasping":[3,73,121],"task":[4,133],"requires":[5],"a":[6,57,97,110],"agent":[8],"to":[9,19,118],"integrate":[10],"multimodal":[11,61,103],"information":[12],"from":[13],"both":[14],"visual":[15],"and":[16,41,50,72,85,109,146],"linguistic":[17],"inputs":[18,104],"predict":[20],"actions":[21],"for":[22,67,105,167],"target-driven":[23],"grasping.":[24],"While":[25],"recent":[26],"approaches":[27],"utilizing":[28],"Multimodal":[29],"Large":[30],"Language":[31],"Models":[32],"(MLLMs)":[33],"have":[34],"shown":[35],"promising":[36],"results,":[37],"their":[38],"extensive":[39],"computation":[40],"data":[42],"demands":[43],"limit":[44],"the":[45,129,144,180],"feasibility":[46],"of":[47],"local":[48],"deployment":[49],"customization.":[51],"To":[52],"address":[53],"this,":[54],"we":[55],"propose":[56],"novel":[58],"CLIP-based":[59,137],"[1]":[60],"parameter-efficient":[62],"tuning":[63,139],"(PET)":[64],"framework":[65],"designed":[66],"three":[68],"object":[70,131,155],"grounding":[71,132],"tasks:":[74],"(1)":[75],"Referring":[76,81,87],"Expression":[77],"Segmentation":[78],"(RES),":[79],"(2)":[80],"Grasp":[82,88],"Synthesis":[83],"(RGS),":[84],"(3)":[86],"Affordance":[89],"(RGA).":[90],"Our":[91],"approach":[92],"introduces":[93],"two":[94],"key":[95],"innovations:":[96],"bi-directional":[98],"vision-language":[99],"adapter":[100],"that":[101,114],"aligns":[102],"pixel-level":[106],"language":[107,160],"understanding":[108],"depth":[111],"fusion":[112],"branch":[113],"incorporates":[115],"geometric":[116],"cues":[117],"facilitate":[119],"predictions.":[122],"Experiment":[123],"results":[124],"demonstrate":[125],"superior":[126],"performance":[127],"in":[128,179],"RES":[130],"compared":[134],"with":[135],"existing":[136],"full-model":[138],"or":[140],"PET":[141],"approaches.":[142],"In":[143],"RGS":[145],"RGA":[147],"tasks,":[148],"our":[149],"model":[150],"not":[151],"only":[152],"effectively":[153],"interprets":[154],"attributes":[156],"based":[157],"on":[158],"simple":[159],"descriptions":[161],"but":[162],"also":[163],"shows":[164],"strong":[165],"potential":[166],"comprehending":[168],"complex":[169],"spatial":[170],"reasoning":[171],"scenarios,":[172],"such":[173],"as":[174],"multiple":[175],"identical":[176],"objects":[177],"present":[178],"workspace.":[181],"Project":[182],"page:":[183],"https://z.umn.edu/etog-etrg":[184]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
