{"id":"https://openalex.org/W7140470349","doi":"https://doi.org/10.48550/arxiv.2603.24097","title":"LaDy: Lagrangian-Dynamic Informed Network for Skeleton-based Action Segmentation via Spatial-Temporal Modulation","display_name":"LaDy: Lagrangian-Dynamic Informed Network for Skeleton-based Action Segmentation via Spatial-Temporal Modulation","publication_year":2026,"publication_date":"2026-03-25","ids":{"openalex":"https://openalex.org/W7140470349","doi":"https://doi.org/10.48550/arxiv.2603.24097"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.24097","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24097","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.24097","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088582121","display_name":"Haoyu Ji","orcid":"https://orcid.org/0009-0007-2150-0791"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ji, Haoyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130712509","display_name":"Xueting Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xueting","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130643096","display_name":"Yu Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Yu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122089455","display_name":"Wenze Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Wenze","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130668440","display_name":"Zhihao Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Zhihao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072203497","display_name":"Weihong Ren","orcid":"https://orcid.org/0000-0003-3839-0078"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ren, Weihong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130705844","display_name":"Zhiyong Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zhiyong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130664673","display_name":"Honghai Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Honghai","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5088582121"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9350000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9350000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.018699999898672104,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.008500000461935997,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.6826000213623047},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6349999904632568},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5672000050544739},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.5260999798774719},{"id":"https://openalex.org/keywords/boundary","display_name":"Boundary (topology)","score":0.4943999946117401},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4442000091075897},{"id":"https://openalex.org/keywords/dynamics","display_name":"Dynamics (music)","score":0.4323999881744385},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.41440001130104065},{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.4090999960899353},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.40619999170303345}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.6826000213623047},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6349999904632568},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6287000179290771},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5672000050544739},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.5260999798774719},{"id":"https://openalex.org/C62354387","wikidata":"https://www.wikidata.org/wiki/Q875399","display_name":"Boundary (topology)","level":2,"score":0.4943999946117401},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4717999994754791},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4442000091075897},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.4323999881744385},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.41440001130104065},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.4090999960899353},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.40619999170303345},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.3776000142097473},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3698999881744385},{"id":"https://openalex.org/C2780186347","wikidata":"https://www.wikidata.org/wiki/Q11414","display_name":"Subnetwork","level":2,"score":0.36399999260902405},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.35260000824928284},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.3343000113964081},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3160000145435333},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.299699991941452},{"id":"https://openalex.org/C77405623","wikidata":"https://www.wikidata.org/wiki/Q598451","display_name":"System dynamics","level":2,"score":0.2939999997615814},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.28999999165534973},{"id":"https://openalex.org/C107551265","wikidata":"https://www.wikidata.org/wiki/Q1458245","display_name":"Displacement (psychology)","level":2,"score":0.2896000146865845},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.28349998593330383},{"id":"https://openalex.org/C28461519","wikidata":"https://www.wikidata.org/wiki/Q2037529","display_name":"Rigid body dynamics","level":3,"score":0.28029999136924744},{"id":"https://openalex.org/C2776937971","wikidata":"https://www.wikidata.org/wiki/Q4384217","display_name":"Heading (navigation)","level":2,"score":0.2736000120639801},{"id":"https://openalex.org/C123079801","wikidata":"https://www.wikidata.org/wiki/Q750240","display_name":"Modulation (music)","level":2,"score":0.2720000147819519},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.26989999413490295},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.26750001311302185},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.26489999890327454},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.26409998536109924},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.2637999951839447},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.26010000705718994},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25760000944137573},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.2563999891281128},{"id":"https://openalex.org/C116672817","wikidata":"https://www.wikidata.org/wiki/Q1454986","display_name":"Physical system","level":2,"score":0.2522999942302704}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.24097","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24097","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.24097","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24097","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.6023861765861511,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Skeleton-based":[0],"Temporal":[1],"Action":[2],"Segmentation":[3],"(STAS)":[4],"aims":[5],"to":[6,96,144],"densely":[7],"parse":[8],"untrimmed":[9],"skeletal":[10],"sequences":[11],"into":[12,75],"frame-level":[13],"action":[14,180],"categories.":[15],"However,":[16],"existing":[17],"methods,":[18],"while":[19],"proficient":[20],"at":[21,185],"capturing":[22],"spatio-temporal":[23],"kinematics,":[24],"neglect":[25],"the":[26,63,76,99,112,120,124,174],"underlying":[27],"physical":[28,94,105,177],"dynamics":[29,74,129,178],"that":[30,168],"govern":[31],"human":[32],"motion.":[33],"This":[34],"oversight":[35],"limits":[36],"inter-class":[37],"discriminability":[38],"between":[39],"actions":[40],"with":[41,119,141],"similar":[42],"kinematics":[43],"but":[44],"distinct":[45],"dynamic":[46,54,151],"intents,":[47],"and":[48,88],"hinders":[49],"precise":[50],"boundary":[51,161],"localization":[52],"where":[53],"force":[55],"profiles":[56],"shift.":[57],"To":[58,102],"address":[59],"these,":[60],"we":[61],"propose":[62],"Lagrangian-Dynamic":[64],"Informed":[65],"Network":[66],"(LaDy),":[67],"a":[68,132],"framework":[69],"integrating":[70],"principles":[71],"of":[72,176],"Lagrangian":[73,91],"segmentation":[77],"process.":[78],"Specifically,":[79],"LaDy":[80,169],"first":[81],"computes":[82],"generalized":[83,100,137],"coordinates":[84],"from":[85],"joint":[86],"positions":[87],"then":[89,130],"estimates":[90],"terms":[92],"under":[93],"constraints":[95],"explicitly":[97],"synthesize":[98],"forces.":[101],"further":[103],"ensure":[104],"coherence,":[106],"our":[107],"Energy":[108],"Consistency":[109],"Loss":[110],"enforces":[111],"work-energy":[113],"theorem,":[114],"aligning":[115],"kinetic":[116],"energy":[117],"change":[118],"work":[121],"done":[122],"by":[123],"net":[125],"force.":[126],"The":[127],"learned":[128],"drive":[131],"Spatio-Temporal":[133],"Modulation":[134],"module:":[135],"Spatially,":[136],"forces":[138],"are":[139,153],"fused":[140],"spatial":[142],"representations":[143],"provide":[145],"more":[146],"discriminative":[147],"semantics.":[148],"Temporally,":[149],"salient":[150],"signals":[152],"constructed":[154],"for":[155,179],"temporal":[156],"gating,":[157],"thereby":[158],"significantly":[159],"enhancing":[160],"awareness.":[162],"Experiments":[163],"on":[164],"challenging":[165],"datasets":[166],"show":[167],"achieves":[170],"state-of-the-art":[171],"performance,":[172],"validating":[173],"integration":[175],"segmentation.":[181],"Code":[182],"is":[183],"available":[184],"https://github.com/HaoyuJi/LaDy.":[186]},"counts_by_year":[],"updated_date":"2026-03-27T06:05:27.210665","created_date":"2026-03-27T00:00:00"}
