{"id":"https://openalex.org/W4413925899","doi":"https://doi.org/10.1109/icra55743.2025.11127328","title":"Persistent Object Gaussian Splat (POGS) for Tracking Human and Robot Manipulation of Irregularly Shaped Objects","display_name":"Persistent Object Gaussian Splat (POGS) for Tracking Human and Robot Manipulation of Irregularly Shaped Objects","publication_year":2025,"publication_date":"2025-05-19","ids":{"openalex":"https://openalex.org/W4413925899","doi":"https://doi.org/10.1109/icra55743.2025.11127328"},"language":"en","primary_location":{"id":"doi:10.1109/icra55743.2025.11127328","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11127328","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101440767","display_name":"Justin Yu","orcid":"https://orcid.org/0009-0006-3683-878X"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Justin Yu","raw_affiliation_strings":["UC Berkeley (automation.berkeley.edu),The AUTOLab"],"affiliations":[{"raw_affiliation_string":"UC Berkeley (automation.berkeley.edu),The AUTOLab","institution_ids":["https://openalex.org/I134446601"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027622116","display_name":"Kush Hari","orcid":null},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kush Hari","raw_affiliation_strings":["UC Berkeley (automation.berkeley.edu),The AUTOLab"],"affiliations":[{"raw_affiliation_string":"UC Berkeley (automation.berkeley.edu),The AUTOLab","institution_ids":["https://openalex.org/I134446601"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091877215","display_name":"Karim El-Refai","orcid":"https://orcid.org/0000-0001-9538-143X"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Karim El-Refai","raw_affiliation_strings":["UC Berkeley (automation.berkeley.edu),The AUTOLab"],"affiliations":[{"raw_affiliation_string":"UC Berkeley (automation.berkeley.edu),The AUTOLab","institution_ids":["https://openalex.org/I134446601"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Arnav Dalal","orcid":null},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Arnav Dalal","raw_affiliation_strings":["UC Berkeley (automation.berkeley.edu),The AUTOLab"],"affiliations":[{"raw_affiliation_string":"UC Berkeley (automation.berkeley.edu),The AUTOLab","institution_ids":["https://openalex.org/I134446601"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022467361","display_name":"Justin Kerr","orcid":"https://orcid.org/0000-0002-0536-4853"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Justin Kerr","raw_affiliation_strings":["UC Berkeley (automation.berkeley.edu),The AUTOLab"],"affiliations":[{"raw_affiliation_string":"UC Berkeley (automation.berkeley.edu),The AUTOLab","institution_ids":["https://openalex.org/I134446601"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074509165","display_name":"Chung Min Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chung Min Kim","raw_affiliation_strings":["UC Berkeley (automation.berkeley.edu),The AUTOLab"],"affiliations":[{"raw_affiliation_string":"UC Berkeley (automation.berkeley.edu),The AUTOLab","institution_ids":["https://openalex.org/I134446601"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020437483","display_name":"Richard K. Cheng","orcid":"https://orcid.org/0000-0001-5994-5998"},"institutions":[{"id":"https://openalex.org/I4391768151","display_name":"Toyota Research Institute","ror":"https://ror.org/04fpkc108","country_code":null,"type":"facility","lineage":["https://openalex.org/I4210125472","https://openalex.org/I4391768151"]}],"countries":[],"is_corresponding":false,"raw_author_name":"Richard Cheng","raw_affiliation_strings":["Toyota Research Institute,Los Altos,CA"],"affiliations":[{"raw_affiliation_string":"Toyota Research Institute,Los Altos,CA","institution_ids":["https://openalex.org/I4391768151"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009075844","display_name":"Muhammad Zubair Irshad","orcid":"https://orcid.org/0000-0002-1955-6194"},"institutions":[{"id":"https://openalex.org/I4391768151","display_name":"Toyota Research Institute","ror":"https://ror.org/04fpkc108","country_code":null,"type":"facility","lineage":["https://openalex.org/I4210125472","https://openalex.org/I4391768151"]}],"countries":[],"is_corresponding":false,"raw_author_name":"Muhammad Zubair Irshad","raw_affiliation_strings":["Toyota Research Institute,Los Altos,CA"],"affiliations":[{"raw_affiliation_string":"Toyota Research Institute,Los Altos,CA","institution_ids":["https://openalex.org/I4391768151"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010019244","display_name":"Ken Goldberg","orcid":"https://orcid.org/0000-0001-6747-9499"},"institutions":[{"id":"https://openalex.org/I134446601","display_name":"Berkeley College","ror":"https://ror.org/02xewxa75","country_code":"US","type":"education","lineage":["https://openalex.org/I134446601"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ken Goldberg","raw_affiliation_strings":["UC Berkeley (automation.berkeley.edu),The AUTOLab"],"affiliations":[{"raw_affiliation_string":"UC Berkeley (automation.berkeley.edu),The AUTOLab","institution_ids":["https://openalex.org/I134446601"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5101440767"],"corresponding_institution_ids":["https://openalex.org/I134446601"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21374556,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"3211","last_page":"3218"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.8252000212669373,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.8252000212669373,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.7882000207901001,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.7775999903678894,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.7342987060546875},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6282341480255127},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6142896413803101},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5950378179550171},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.5322171449661255},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5056147575378418},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.11153364181518555}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7342987060546875},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6282341480255127},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6142896413803101},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5950378179550171},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.5322171449661255},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5056147575378418},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.11153364181518555},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra55743.2025.11127328","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra55743.2025.11127328","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1956566774","https://openalex.org/W2285041431","https://openalex.org/W2980383450","https://openalex.org/W3134664367","https://openalex.org/W3190988267","https://openalex.org/W3207187156","https://openalex.org/W4200150166","https://openalex.org/W4221151978","https://openalex.org/W4221155806","https://openalex.org/W4225759270","https://openalex.org/W4226265017","https://openalex.org/W4281557677","https://openalex.org/W4285102336","https://openalex.org/W4312424618","https://openalex.org/W4378450585","https://openalex.org/W4383108296","https://openalex.org/W4383108895","https://openalex.org/W4385318467","https://openalex.org/W4385431115","https://openalex.org/W4386066287","https://openalex.org/W4390872744","https://openalex.org/W4399574574","https://openalex.org/W4400904825","https://openalex.org/W4401414715","https://openalex.org/W4401417061","https://openalex.org/W4402703038","https://openalex.org/W4402713101","https://openalex.org/W4402716032","https://openalex.org/W4402727529","https://openalex.org/W4402727915","https://openalex.org/W4402754209","https://openalex.org/W4402916615","https://openalex.org/W4404446913","https://openalex.org/W4405785623"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Tracking":[0],"and":[1,18,52,92,119,137,161],"manipulating":[2],"irregularly-shaped,":[3],"previously":[4],"unseen":[5],"objects":[6],"in":[7,15],"dynamic":[8],"environments":[9],"is":[10],"important":[11],"for":[12,34,111],"robotic":[13],"applications":[14],"manufacturing,":[16],"assembly,":[17],"logistics.":[19],"Recently":[20],"introduced":[21],"Gaussian":[22,41],"Splats":[23],"[1]":[24],"efficiently":[25],"model":[26],"object":[27,53,74,112,125,130,135,159],"geometry,":[28],"but":[29],"lack":[30],"persistent":[31],"state":[32],"estimation":[33],"taskoriented":[35],"manipulation.":[36],"We":[37],"present":[38],"Persistent":[39],"Object":[40],"Splat":[42],"(POGS),":[43],"a":[44,57,97],"system":[45],"that":[46,60],"embeds":[47],"semantics,":[48],"self-supervised":[49,107],"visual":[50],"features,":[51],"grouping":[54],"features":[55,110],"into":[56],"compact":[58],"representation":[59],"can":[61],"be":[62],"continuously":[63],"updated":[64],"to":[65,101,150,155],"estimate":[66],"the":[67],"pose":[68,113,126,144],"of":[69,84,148,165],"scanned":[70],"objects.":[71,85],"POGS":[72,95,115,152],"updates":[73],"states":[75],"without":[76],"requiring":[77],"expensive":[78],"rescanning":[79],"or":[80],"prior":[81],"CAD":[82],"models":[83],"After":[86],"an":[87],"initial":[88],"multi-view":[89],"scene":[90],"capture":[91],"training":[93],"phase,":[94],"uses":[96],"single":[98],"stereo":[99],"camera":[100],"integrate":[102],"depth":[103],"estimates":[104],"along":[105],"with":[106,133],"vision":[108],"encoder":[109],"estimation.":[114],"supports":[116],"grasping,":[117],"reorientation,":[118],"natural":[120],"language-driven":[121],"manipulation":[122],"by":[123],"refining":[124],"estimates,":[127],"facilitating":[128],"sequential":[129],"reset":[131],"operations":[132],"human-induced":[134],"perturbations":[136,147],"tool":[138,143,146,167],"servoing,":[139],"where":[140],"robots":[141],"recover":[142],"despite":[145],"up":[149,154],"30\u00b0.":[151],"achieves":[153],"12":[156],"consecutive":[157],"successful":[158],"resets":[160],"recovers":[162],"from":[163],"80%":[164],"in-grasp":[166],"perturbations.":[168]},"counts_by_year":[],"updated_date":"2026-04-17T18:11:37.981687","created_date":"2025-10-10T00:00:00"}
