{"id":"https://openalex.org/W7139118315","doi":"https://doi.org/10.48550/arxiv.2603.16343","title":"Learning Human-Object Interaction for 3D Human Pose Estimation from LiDAR Point Clouds","display_name":"Learning Human-Object Interaction for 3D Human Pose Estimation from LiDAR Point Clouds","publication_year":2026,"publication_date":"2026-03-17","ids":{"openalex":"https://openalex.org/W7139118315","doi":"https://doi.org/10.48550/arxiv.2603.16343"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.16343","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16343","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.16343","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104156507","display_name":"Daniel Sungho Jung","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jung, Daniel Sungho","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130062164","display_name":"Dohee Cho","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cho, Dohee","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130056398","display_name":"Kyoung Hyun Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Kyoung Mu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.7134000062942505,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.7134000062942505,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.0632999986410141,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.03180000185966492,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.6948999762535095},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.652400016784668},{"id":"https://openalex.org/keywords/lidar","display_name":"Lidar","score":0.631600022315979},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.6147000193595886},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.5695000290870667},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.49540001153945923},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4659000039100647},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.45989999175071716},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4323999881744385}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7107999920845032},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.6948999762535095},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6934999823570251},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.652400016784668},{"id":"https://openalex.org/C51399673","wikidata":"https://www.wikidata.org/wiki/Q504027","display_name":"Lidar","level":2,"score":0.631600022315979},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.6147000193595886},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.5695000290870667},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.49540001153945923},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4684000015258789},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4659000039100647},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.45989999175071716},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4323999881744385},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34929999709129333},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32170000672340393},{"id":"https://openalex.org/C115051666","wikidata":"https://www.wikidata.org/wiki/Q6522493","display_name":"Ranging","level":2,"score":0.3165999948978424},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.3050000071525574},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3012000024318695},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.2930999994277954},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.2879999876022339},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2784000039100647},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.27149999141693115},{"id":"https://openalex.org/C2777113093","wikidata":"https://www.wikidata.org/wiki/Q221488","display_name":"Pedestrian","level":2,"score":0.2705000042915344},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C2987082051","wikidata":"https://www.wikidata.org/wiki/Q223642","display_name":"Human interaction","level":2,"score":0.2606000006198883},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2599000036716461},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.2572000026702881},{"id":"https://openalex.org/C38764148","wikidata":"https://www.wikidata.org/wiki/Q17098245","display_name":"Interaction information","level":2,"score":0.2515999972820282},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.16343","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16343","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.16343","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16343","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.5827454328536987},{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.4590774178504944}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Understanding":[0],"humans":[1],"from":[2,142,198],"LiDAR":[3,122,143],"point":[4,144],"clouds":[5],"is":[6],"one":[7],"of":[8,31,45,66,101],"the":[9,29,43,64,99,110,148,175],"most":[10],"critical":[11],"tasks":[12],"in":[13,28,89,98,121,170,238],"autonomous":[14],"driving":[15],"due":[16],"to":[17,49,83,231],"its":[18],"close":[19],"relationships":[20],"with":[21,109],"pedestrian":[22],"safety,":[23],"yet":[24],"it":[25],"remains":[26],"challenging":[27],"presence":[30],"diverse":[32],"human-object":[33,47,67,70,154,229],"interactions":[34,48,71],"and":[35,77,105,116,166,235],"cluttered":[36],"backgrounds.":[37],"Nevertheless,":[38],"existing":[39],"methods":[40],"largely":[41],"overlook":[42],"potential":[44],"leveraging":[46],"build":[50],"robust":[51,137],"3D":[52,85,138],"human":[53,76,86,139,165],"pose":[54,140],"estimation":[55,141],"frameworks.":[56],"There":[57],"are":[58],"two":[59],"major":[60],"challenges":[61],"that":[62,159,185,211],"motivate":[63],"incorporation":[65],"interaction.":[68],"First,":[69],"introduce":[72,180],"spatial":[73,149,233],"ambiguity":[74,150,234],"between":[75,103,164],"object":[78,167],"points,":[79,168],"which":[80],"often":[81],"leads":[82],"erroneous":[84,213],"keypoint":[87,215],"predictions":[88],"interaction":[90,171,230,239],"regions.":[91,172,240],"Second,":[92],"there":[93],"exists":[94],"severe":[95],"class":[96,176,236],"imbalance":[97,177,237],"number":[100],"points":[102,193,197],"interacting":[104,199],"non-interacting":[106],"body":[107,200],"parts,":[108],"interaction-frequent":[111],"regions":[112],"such":[113],"as":[114],"hand":[115],"foot":[117],"being":[118],"sparsely":[119],"observed":[120],"data.":[123],"To":[124,146,173],"address":[125],"these":[126],"challenges,":[127],"we":[128,152,179,204],"propose":[129],"a":[130,223],"Human-Object":[131],"Interaction":[132],"Learning":[133],"(HOIL)":[134],"framework":[135],"for":[136],"clouds.":[145],"mitigate":[147],"issue,":[151,178],"present":[153,205],"interaction-aware":[155],"contrastive":[156],"learning":[157],"(HOICL)":[158],"effectively":[160,227],"enhances":[161],"feature":[162],"discrimination":[163],"particularly":[169],"alleviate":[174],"contact-aware":[181],"part-guided":[182],"pooling":[183],"(CPPool)":[184],"adaptively":[186],"reallocates":[187],"representational":[188],"capacity":[189],"by":[190],"compressing":[191],"overrepresented":[192],"while":[194],"preserving":[195],"informative":[196],"parts.":[201],"In":[202],"addition,":[203],"an":[206],"optional":[207],"contact-based":[208],"temporal":[209],"refinement":[210],"refines":[212],"per-frame":[214],"estimates":[216],"using":[217],"contact":[218],"cues":[219],"over":[220],"time.":[221],"As":[222],"result,":[224],"our":[225],"HOIL":[226],"leverages":[228],"resolve":[232],"Codes":[241],"will":[242],"be":[243],"released.":[244]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-20T00:00:00"}
