{"id":"https://openalex.org/W7126087654","doi":"https://doi.org/10.1109/comcomap68359.2025.11353140","title":"A Survey of Physical AI: Foundations in OpenUSD, GR00T, VLMs, and the NVIDIA Omniverse Ecosystem","display_name":"A Survey of Physical AI: Foundations in OpenUSD, GR00T, VLMs, and the NVIDIA Omniverse Ecosystem","publication_year":2025,"publication_date":"2025-12-14","ids":{"openalex":"https://openalex.org/W7126087654","doi":"https://doi.org/10.1109/comcomap68359.2025.11353140"},"language":null,"primary_location":{"id":"doi:10.1109/comcomap68359.2025.11353140","is_oa":false,"landing_page_url":"https://doi.org/10.1109/comcomap68359.2025.11353140","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Computing, Communications and IoT Applications (ComComAp)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124250877","display_name":"Sebastian Caballero-Roa","orcid":null},"institutions":[{"id":"https://openalex.org/I2613432","display_name":"University of South Florida","ror":"https://ror.org/032db5x82","country_code":"US","type":"education","lineage":["https://openalex.org/I2613432"]},{"id":"https://openalex.org/I75821886","display_name":"University of South Florida St. Petersburg","ror":"https://ror.org/016gp6x28","country_code":"US","type":"education","lineage":["https://openalex.org/I75821886"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sebastian Caballero-Roa","raw_affiliation_strings":["Univ. of South Florida,FL,USA"],"affiliations":[{"raw_affiliation_string":"Univ. of South Florida,FL,USA","institution_ids":["https://openalex.org/I2613432","https://openalex.org/I75821886"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5117416065","display_name":"Juan Mart\u00ednez-P\u00e1ez","orcid":null},"institutions":[{"id":"https://openalex.org/I2613432","display_name":"University of South Florida","ror":"https://ror.org/032db5x82","country_code":"US","type":"education","lineage":["https://openalex.org/I2613432"]},{"id":"https://openalex.org/I75821886","display_name":"University of South Florida St. Petersburg","ror":"https://ror.org/016gp6x28","country_code":"US","type":"education","lineage":["https://openalex.org/I75821886"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Juan Martinez-Paez","raw_affiliation_strings":["Univ. of South Florida,FL,USA"],"affiliations":[{"raw_affiliation_string":"Univ. of South Florida,FL,USA","institution_ids":["https://openalex.org/I2613432","https://openalex.org/I75821886"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121372861","display_name":"Mohamed Rahouti","orcid":null},"institutions":[{"id":"https://openalex.org/I164389053","display_name":"Fordham University","ror":"https://ror.org/03qnxaf80","country_code":"US","type":"education","lineage":["https://openalex.org/I164389053"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mohamed Rahouti","raw_affiliation_strings":["Fordham Univ,NY,USA"],"affiliations":[{"raw_affiliation_string":"Fordham Univ,NY,USA","institution_ids":["https://openalex.org/I164389053"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023985430","display_name":"Nasir Abdul Ghani","orcid":null},"institutions":[{"id":"https://openalex.org/I2613432","display_name":"University of South Florida","ror":"https://ror.org/032db5x82","country_code":"US","type":"education","lineage":["https://openalex.org/I2613432"]},{"id":"https://openalex.org/I75821886","display_name":"University of South Florida St. Petersburg","ror":"https://ror.org/016gp6x28","country_code":"US","type":"education","lineage":["https://openalex.org/I75821886"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nasir Ghani","raw_affiliation_strings":["Univ. of South Florida,FL,USA"],"affiliations":[{"raw_affiliation_string":"Univ. of South Florida,FL,USA","institution_ids":["https://openalex.org/I2613432","https://openalex.org/I75821886"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5124250877"],"corresponding_institution_ids":["https://openalex.org/I2613432","https://openalex.org/I75821886"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.72223507,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"221","last_page":"227"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.12150000035762787,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.12150000035762787,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11883","display_name":"Embodied and Extended Cognition","score":0.061400000005960464,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.05950000137090683,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5060999989509583},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.43950000405311584},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.42179998755455017},{"id":"https://openalex.org/keywords/embodied-cognition","display_name":"Embodied cognition","score":0.4131999909877777},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4090000092983246},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.36419999599456787}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5942999720573425},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5060999989509583},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4399000108242035},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.43950000405311584},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.42179998755455017},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.414900004863739},{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.4131999909877777},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4090000092983246},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.4052000045776367},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.36419999599456787},{"id":"https://openalex.org/C194969405","wikidata":"https://www.wikidata.org/wiki/Q170519","display_name":"Virtual reality","level":2,"score":0.29989999532699585},{"id":"https://openalex.org/C2780440489","wikidata":"https://www.wikidata.org/wiki/Q5227278","display_name":"Data-driven","level":2,"score":0.29409998655319214},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2870999872684479},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2824000120162964},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.2770000100135803},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.26739999651908875},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.26179999113082886},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.25780001282691956},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.25600001215934753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/comcomap68359.2025.11353140","is_oa":false,"landing_page_url":"https://doi.org/10.1109/comcomap68359.2025.11353140","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Computing, Communications and IoT Applications (ComComAp)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4139823913574219,"id":"https://metadata.un.org/sdg/15","display_name":"Life in Land"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W2397253692","https://openalex.org/W2605102758","https://openalex.org/W2607968634","https://openalex.org/W2767050701","https://openalex.org/W2911087563","https://openalex.org/W4231563569","https://openalex.org/W4367016688","https://openalex.org/W4383097638","https://openalex.org/W4385403811","https://openalex.org/W4402353985"],"related_works":[],"abstract_inverted_index":{"Physical":[0,41],"Artificial":[1],"Intelligence":[2],"(AI),":[3],"or":[4],"embodied":[5],"AI,":[6,42],"represents":[7],"a":[8,18,33,55,60,90,109],"paradigm":[9],"shift":[10],"from":[11],"purely":[12],"virtual":[13],"intelligence":[14],"to":[15,102],"systems":[16],"with":[17,119],"physical":[19],"presence":[20],"capable":[21],"of":[22,36,40,47,64,148,158],"perceiving,":[23],"reasoning,":[24],"and":[25,50,85,142,151],"acting":[26],"upon":[27],"the":[28,37,44,65,139,146,156],"world.":[29],"This":[30],"survey":[31,131],"provides":[32],"comprehensive":[34],"review":[35],"foundational":[38],"concepts":[39],"highlighting":[43],"critical":[45],"role":[46],"foundation":[48],"models":[49,150],"integrated":[51],"development":[52,92],"platforms.":[53],"As":[54],"case":[56],"study,":[57],"we":[58],"conduct":[59],"deep":[61],"vertical":[62],"analysis":[63,107],"NVIDIA":[66],"ecosystem,":[67],"examining":[68],"how":[69],"simulation":[70],"(Omniverse,":[71],"Isaac":[72],"Sim),":[73],"synthetic":[74],"data":[75],"generation":[76],"(Cosmos),":[77],"robot":[78],"learning":[79],"(Isaac":[80,83],"Lab),":[81],"perception":[82],"ROS),":[84],"edge":[86],"computing":[87],"(Jetson)":[88],"create":[89],"self-reinforcing":[91],"cycle.":[93],"We":[94],"further":[95],"analyze":[96],"state-of-the-art":[97],"architectures,":[98],"comparing":[99],"language-grounded":[100],"planners":[101],"generalist":[103],"Vision-Language-Action":[104],"policies.":[105],"Our":[106],"reveals":[108],"clear":[110],"convergence":[111,147],"towards":[112],"hybrid":[113],"architectures":[114],"that":[115],"combine":[116],"deliberative":[117],"reasoning":[118],"reactive":[120],"control,":[121],"heavily":[122],"relying":[123],"on":[124],"standards":[125],"like":[126],"OpenUSD":[127],"for":[128],"interoperability.":[129],"The":[130],"concludes":[132],"by":[133],"discussing":[134],"key":[135],"limitations,":[136],"such":[137],"as":[138],"sim-to-real":[140],"gap":[141],"proprietary":[143],"lock-in,":[144],"emphasizing":[145],"learned":[149],"classical":[152],"techniques":[153],"in":[154],"shaping":[155],"future":[157],"autonomous":[159],"systems.":[160]},"counts_by_year":[],"updated_date":"2026-02-01T03:34:12.195049","created_date":"2026-01-30T00:00:00"}
