{"id":"https://openalex.org/W4415332376","doi":"https://doi.org/10.48550/arxiv.2509.23455","title":"3DPCNet: Pose Canonicalization for Robust Viewpoint-Invariant 3D Kinematic Analysis from Monocular RGB cameras","display_name":"3DPCNet: Pose Canonicalization for Robust Viewpoint-Invariant 3D Kinematic Analysis from Monocular RGB cameras","publication_year":2025,"publication_date":"2025-09-27","ids":{"openalex":"https://openalex.org/W4415332376","doi":"https://doi.org/10.48550/arxiv.2509.23455"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2509.23455","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.23455","pdf_url":"https://arxiv.org/pdf/2509.23455","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2509.23455","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079517833","display_name":"Thushara Ekanayake","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ekanayake, Tharindu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051136793","display_name":"Constantino \u00c1lvarez Casado","orcid":"https://orcid.org/0000-0002-3052-4759"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Casado, Constantino \u00c1lvarez","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5005498985","display_name":"Miguel Bordallo L\u00f3pez","orcid":"https://orcid.org/0000-0002-5707-9085"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"L\u00f3pez, Miguel Bordallo","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5079517833"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.6776999831199646},{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.5910000205039978},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.5149999856948853},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.49619999527931213},{"id":"https://openalex.org/keywords/rotation","display_name":"Rotation (mathematics)","score":0.45750001072883606},{"id":"https://openalex.org/keywords/inertial-measurement-unit","display_name":"Inertial measurement unit","score":0.415800005197525},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.4059999883174896},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4000999927520752}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7487000226974487},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7091000080108643},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.6776999831199646},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6409000158309937},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.5910000205039978},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.5149999856948853},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.49619999527931213},{"id":"https://openalex.org/C74050887","wikidata":"https://www.wikidata.org/wiki/Q848368","display_name":"Rotation (mathematics)","level":2,"score":0.45750001072883606},{"id":"https://openalex.org/C79061980","wikidata":"https://www.wikidata.org/wiki/Q941680","display_name":"Inertial measurement unit","level":2,"score":0.415800005197525},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.4059999883174896},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4000999927520752},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.3982999920845032},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.39239999651908875},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3833000063896179},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.3662000000476837},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.3531999886035919},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.32109999656677246},{"id":"https://openalex.org/C158829959","wikidata":"https://www.wikidata.org/wiki/Q1640606","display_name":"Monocular vision","level":2,"score":0.3174999952316284},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.3041999936103821},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.29179999232292175},{"id":"https://openalex.org/C83633838","wikidata":"https://www.wikidata.org/wiki/Q1256564","display_name":"Rotation matrix","level":2,"score":0.2797999978065491},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.26570001244544983},{"id":"https://openalex.org/C193581530","wikidata":"https://www.wikidata.org/wiki/Q683778","display_name":"Structured light","level":2,"score":0.2606000006198883}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2509.23455","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.23455","pdf_url":"https://arxiv.org/pdf/2509.23455","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2509.23455","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.23455","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2509.23455","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.23455","pdf_url":"https://arxiv.org/pdf/2509.23455","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Monocular":[0],"3D":[1,34],"pose":[2,41,118],"estimators":[3],"produce":[4],"camera-centered":[5],"skeletons,":[6],"creating":[7],"view-dependent":[8],"kinematic":[9],"signals":[10,166],"that":[11,30,81,161,169,180],"complicate":[12],"comparative":[13],"analysis":[14],"in":[15,96],"applications":[16],"such":[17],"as":[18],"health":[19],"and":[20,117,135],"sports":[21],"science.":[22],"We":[23,92],"present":[24],"3DPCNet,":[25],"a":[26,43,56,64,67,77,97,110,150],"compact,":[27],"estimator-agnostic":[28],"module":[29,182],"operates":[31],"directly":[32],"on":[33,100,155],"joint":[35],"coordinates":[36],"to":[37,84,88,133,145,149,174,186],"rectify":[38],"any":[39],"input":[40],"into":[42],"consistent,":[44],"body-centered":[45],"canonical":[46],"frame.":[47],"Its":[48],"hybrid":[49],"encoder":[50],"fuses":[51],"local":[52],"skeletal":[53],"features":[54],"from":[55,63,130,142,167],"graph":[57],"convolutional":[58],"network":[59],"with":[60],"global":[61],"context":[62],"transformer":[65],"via":[66],"gated":[68],"cross-attention":[69],"mechanism.":[70],"From":[71],"this":[72],"representation,":[73],"the":[74,90,94,101,121,126,136,156],"model":[75,95],"predicts":[76],"continuous":[78],"6D":[79],"rotation":[80,116,128],"is":[82],"mapped":[83],"an":[85],"$SO(3)$":[86],"matrix":[87],"align":[89],"pose.":[91],"train":[93],"self-supervised":[98],"manner":[99],"MM-Fi":[102,122],"dataset":[103,158],"using":[104],"synthetically":[105],"rotated":[106],"poses,":[107],"guided":[108],"by":[109],"composite":[111],"loss":[112],"ensuring":[113],"both":[114],"accurate":[115],"reconstruction.":[119],"On":[120],"benchmark,":[123],"3DPCNet":[124],"reduces":[125],"mean":[127],"error":[129],"over":[131],"20$^{\\circ}$":[132],"3.4$^{\\circ}$":[134],"Mean":[137],"Per":[138],"Joint":[139],"Position":[140],"Error":[141],"~64":[143],"mm":[144,147],"47":[146],"compared":[148],"geometric":[151],"baseline.":[152],"Qualitative":[153],"evaluations":[154],"TotalCapture":[157],"further":[159],"demonstrate":[160],"our":[162,181],"method":[163],"produces":[164],"acceleration":[165],"video":[168],"show":[170],"strong":[171],"visual":[172],"correspondence":[173],"ground-truth":[175],"IMU":[176],"sensor":[177],"data,":[178],"confirming":[179],"removes":[183],"viewpoint":[184],"variability":[185],"enable":[187],"physically":[188],"plausible":[189],"motion":[190],"analysis.":[191]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-19T00:00:00"}
