{"id":"https://openalex.org/W2513076446","doi":"https://doi.org/10.1145/2964284.2964322","title":"Human Pose Estimation from Depth Images via Inference Embedded Multi-task Learning","display_name":"Human Pose Estimation from Depth Images via Inference Embedded Multi-task Learning","publication_year":2016,"publication_date":"2016-09-29","ids":{"openalex":"https://openalex.org/W2513076446","doi":"https://doi.org/10.1145/2964284.2964322","mag":"2513076446"},"language":"en","primary_location":{"id":"doi:10.1145/2964284.2964322","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2964284.2964322","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 24th ACM international conference on Multimedia","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088124671","display_name":"Keze Wang","orcid":"https://orcid.org/0000-0002-7817-8306"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Keze Wang","raw_affiliation_strings":["Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075393806","display_name":"Shengfu Zhai","orcid":null},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengfu Zhai","raw_affiliation_strings":["Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101409148","display_name":"Hui Cheng","orcid":"https://orcid.org/0000-0003-2579-7004"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hui Cheng","raw_affiliation_strings":["Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047878798","display_name":"Xiaodan Liang","orcid":"https://orcid.org/0000-0003-3213-3062"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaodan Liang","raw_affiliation_strings":["Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5092355007","display_name":"Liang Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Lin","raw_affiliation_strings":["Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5088124671"],"corresponding_institution_ids":["https://openalex.org/I157773358"],"apc_list":null,"apc_paid":null,"fwci":2.84210053,"has_fulltext":false,"cited_by_count":37,"citation_normalized_percentile":{"value":0.94434344,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1227","last_page":"1236"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.8537224531173706},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8014682531356812},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.7854940891265869},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7581524848937988},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6292895078659058},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5907552242279053},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5618830323219299},{"id":"https://openalex.org/keywords/articulated-body-pose-estimation","display_name":"Articulated body pose estimation","score":0.5473135709762573},{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.4917652904987335},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4878220856189728},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.46564850211143494},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.4185444116592407},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4154198467731476},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.38356712460517883},{"id":"https://openalex.org/keywords/3d-pose-estimation","display_name":"3D pose estimation","score":0.3654230833053589},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08000442385673523}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.8537224531173706},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8014682531356812},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.7854940891265869},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7581524848937988},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6292895078659058},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5907552242279053},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5618830323219299},{"id":"https://openalex.org/C22100474","wikidata":"https://www.wikidata.org/wiki/Q4800952","display_name":"Articulated body pose estimation","level":4,"score":0.5473135709762573},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.4917652904987335},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4878220856189728},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.46564850211143494},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.4185444116592407},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4154198467731476},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.38356712460517883},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.3654230833053589},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08000442385673523},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2964284.2964322","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2964284.2964322","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 24th ACM international conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W31861159","https://openalex.org/W171061157","https://openalex.org/W1551519658","https://openalex.org/W1903029394","https://openalex.org/W1912860515","https://openalex.org/W1925417509","https://openalex.org/W1929856797","https://openalex.org/W1936750108","https://openalex.org/W1951304353","https://openalex.org/W1973255633","https://openalex.org/W1985912834","https://openalex.org/W1993164181","https://openalex.org/W2000205118","https://openalex.org/W2013640163","https://openalex.org/W2026720449","https://openalex.org/W2036196300","https://openalex.org/W2038052836","https://openalex.org/W2039262381","https://openalex.org/W2045798786","https://openalex.org/W2051090063","https://openalex.org/W2060280062","https://openalex.org/W2071730211","https://openalex.org/W2086618980","https://openalex.org/W2092423930","https://openalex.org/W2097041931","https://openalex.org/W2102605133","https://openalex.org/W2103015390","https://openalex.org/W2113325037","https://openalex.org/W2136391815","https://openalex.org/W2155394491","https://openalex.org/W2155893237","https://openalex.org/W2168356304","https://openalex.org/W2172156083","https://openalex.org/W2192598490","https://openalex.org/W2204578866","https://openalex.org/W2212123867","https://openalex.org/W2313077179","https://openalex.org/W2330154883","https://openalex.org/W2336626189","https://openalex.org/W2341907540","https://openalex.org/W2353169560","https://openalex.org/W2463113024","https://openalex.org/W2471048925","https://openalex.org/W2471138382","https://openalex.org/W2595840341","https://openalex.org/W2597851033","https://openalex.org/W2613433911","https://openalex.org/W2618530766","https://openalex.org/W2963048156","https://openalex.org/W2963592930","https://openalex.org/W2963758239","https://openalex.org/W3099037876","https://openalex.org/W3102322242","https://openalex.org/W3103722964","https://openalex.org/W3141021069","https://openalex.org/W6640131737"],"related_works":["https://openalex.org/W2946083937","https://openalex.org/W2798721181","https://openalex.org/W4386075737","https://openalex.org/W2951583186","https://openalex.org/W4299867837","https://openalex.org/W2088028039","https://openalex.org/W4382141741","https://openalex.org/W3165753266","https://openalex.org/W1968783203","https://openalex.org/W3213413335"],"abstract_inverted_index":{"Human":[0],"pose":[1,38,80,179],"estimation":[2,180],"(i.e.,":[3],"locating":[4],"the":[5,30,47,103,118,126,138,149,169,175],"body":[6,108,122,128,145],"parts":[7,109,123,146],"/":[8],"joints":[9],"of":[10,32,46,92,107,121,144,177],"a":[11,14,71,89,111,191],"person)":[12],"is":[13,86],"fundamental":[15],"problem":[16,52],"in":[17],"human-computer":[18],"interaction":[19],"and":[20,60,140,147],"multimedia":[21],"applications.":[22],"Significant":[23],"progress":[24],"has":[25],"been":[26],"made":[27],"based":[28,124],"on":[29,125],"development":[31],"depth":[33,42,83,199],"sensors,":[34],"i.e.,":[35],"accessible":[36],"human":[37,79,178],"prediction":[39],"from":[40,81],"still":[41,82],"images~\\cite{rf12pami}.":[43],"However,":[44],"most":[45],"existing":[48],"approaches":[49],"to":[50,63],"this":[51,67],"involve":[53],"several":[54,183],"components/models":[55],"that":[56,168],"are":[57,161],"independently":[58],"designed":[59],"optimized,":[61],"leading":[62],"suboptimal":[64],"performances.":[65],"In":[66],"paper,":[68],"we":[69,96],"propose":[70],"novel":[72],"inference-embedded":[73],"multi-task":[74],"learning":[75],"framework":[76],"for":[77,194],"predicting":[78],"images,":[84],"which":[85,136,196],"implemented":[87],"with":[88],"deep":[90,171],"architecture":[91],"neural":[93],"networks.":[94],"Specifically,":[95],"handle":[97],"two":[98,159],"cascaded":[99],"tasks:":[100],"i)":[101],"generating":[102],"heat":[104],"(confidence)":[105],"maps":[106],"via":[110,131],"fully":[112],"convolutional":[113],"network":[114,156],"(FCN);":[115],"ii)":[116],"seeking":[117],"optimal":[119],"configuration":[120],"detected":[127],"part":[129],"proposals":[130],"an":[132,154],"inference":[133,152],"built-in":[134],"MatchNet~\\cite{mn15cvpr},":[135],"measures":[137],"appearance":[139],"geometric":[141],"kinematic":[142],"compatibility":[143],"embodies":[148],"dynamic":[150],"programming":[151],"as":[153],"extra":[155],"layer.":[157],"These":[158],"tasks":[160],"jointly":[162],"optimized.":[163],"Our":[164],"extensive":[165],"experiments":[166],"show":[167],"proposed":[170],"model":[172],"significantly":[173],"improves":[174],"accuracy":[176],"over":[181],"other":[182],"state-of-the-art":[184],"methods":[185],"or":[186],"SDKs.":[187],"We":[188],"also":[189],"release":[190],"large-scale":[192],"dataset":[193],"comparison,":[195],"includes":[197],"100K":[198],"images":[200],"under":[201],"challenging":[202],"scenarios.":[203]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":11},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
