{"id":"https://openalex.org/W3196614915","doi":"https://doi.org/10.1145/3460426.3463605","title":"HPOF:3D Human Pose Recovery from Monocular Video with Optical Flow","display_name":"HPOF:3D Human Pose Recovery from Monocular Video with Optical Flow","publication_year":2021,"publication_date":"2021-08-24","ids":{"openalex":"https://openalex.org/W3196614915","doi":"https://doi.org/10.1145/3460426.3463605","mag":"3196614915"},"language":"en","primary_location":{"id":"doi:10.1145/3460426.3463605","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3460426.3463605","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5021280842","display_name":"Bin Ji","orcid":"https://orcid.org/0000-0002-8981-5251"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Bin Ji","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100350500","display_name":"Yang Chen","orcid":"https://orcid.org/0000-0003-4496-7849"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chen Yang","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000577985","display_name":"Shunyu Yao","orcid":"https://orcid.org/0000-0002-1683-286X"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yao Shunyu","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052414408","display_name":"Ye Pan","orcid":"https://orcid.org/0000-0002-2645-1809"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ye Pan","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5021280842"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.1921,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.48887255,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"144","last_page":"154"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11227","display_name":"Diabetic Foot Ulcer Assessment and Management","score":0.9860000014305115,"subfield":{"id":"https://openalex.org/subfields/2712","display_name":"Endocrinology, Diabetes and Metabolism"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.820723295211792},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.766508936882019},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.6724915504455566},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6724432706832886},{"id":"https://openalex.org/keywords/optical-flow","display_name":"Optical flow","score":0.6707395315170288},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6415313482284546},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5617071986198425},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5151968598365784},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.506320595741272},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.49840855598449707},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.4973185360431671},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.4832957088947296},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3333103656768799},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.24114349484443665}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.820723295211792},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.766508936882019},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.6724915504455566},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6724432706832886},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.6707395315170288},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6415313482284546},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5617071986198425},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5151968598365784},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.506320595741272},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.49840855598449707},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.4973185360431671},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.4832957088947296},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3333103656768799},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.24114349484443665},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3460426.3463605","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3460426.3463605","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https://openalex.org/W1496316025","https://openalex.org/W1943191679","https://openalex.org/W1967554269","https://openalex.org/W1976333597","https://openalex.org/W2064675550","https://openalex.org/W2101032778","https://openalex.org/W2137591992","https://openalex.org/W2172156083","https://openalex.org/W2194775991","https://openalex.org/W2502928967","https://openalex.org/W2545173102","https://openalex.org/W2554247908","https://openalex.org/W2560474170","https://openalex.org/W2573098616","https://openalex.org/W2604375920","https://openalex.org/W2612706635","https://openalex.org/W2756050327","https://openalex.org/W2771965516","https://openalex.org/W2797184202","https://openalex.org/W2797515701","https://openalex.org/W2798411580","https://openalex.org/W2798637590","https://openalex.org/W2798646183","https://openalex.org/W2916798096","https://openalex.org/W2956061722","https://openalex.org/W2962730651","https://openalex.org/W2962754033","https://openalex.org/W2962896489","https://openalex.org/W2963515833","https://openalex.org/W2963527086","https://openalex.org/W2963590054","https://openalex.org/W2963688992","https://openalex.org/W2963782415","https://openalex.org/W2963873475","https://openalex.org/W2963907666","https://openalex.org/W2963995996","https://openalex.org/W2964084369","https://openalex.org/W2964156315","https://openalex.org/W2964304707","https://openalex.org/W2971856312","https://openalex.org/W2975420824","https://openalex.org/W2978956737","https://openalex.org/W2981637078","https://openalex.org/W2981660954","https://openalex.org/W2984612350","https://openalex.org/W2990270790","https://openalex.org/W2993728126","https://openalex.org/W3035551320","https://openalex.org/W3037374099","https://openalex.org/W3110095664","https://openalex.org/W3177525997","https://openalex.org/W4236667477","https://openalex.org/W4249009392","https://openalex.org/W4251108253","https://openalex.org/W4301045096"],"related_works":["https://openalex.org/W2123263858","https://openalex.org/W3127959533","https://openalex.org/W4390516098","https://openalex.org/W2181948922","https://openalex.org/W2384362569","https://openalex.org/W4387967917","https://openalex.org/W200819717","https://openalex.org/W4307623796","https://openalex.org/W4394784820","https://openalex.org/W3005839910"],"abstract_inverted_index":{"This":[0],"paper":[1],"introduces":[2],"HPOF,":[3],"a":[4,16,36,52,56,131,137,163,192],"novel":[5,132],"deep":[6],"neural":[7],"network":[8],"to":[9,25,40,82,107,117,172,186,220],"reconstruct":[10],"the":[11,27,42,45,49,61,73,83,91,109,144,154,157,188,202,209,214,222,229],"3D":[12,67,205],"human":[13,148],"motion":[14],"from":[15,51],"monocular":[17],"video.":[18,215],"Recently,":[19],"model-based":[20],"methods":[21],"have":[22],"been":[23],"proposed":[24],"simplify":[26],"reconstruction":[28,189],"task":[29],"by":[30],"estimating":[31],"several":[32],"parameters":[33,50],"that":[34,197],"control":[35],"deformable":[37],"surface":[38],"model":[39],"fit":[41],"person":[43],"in":[44,99,191],"image.":[46],"However,":[47],"learning":[48,145,182],"single":[53],"image":[54],"is":[55,63,79,184],"highly":[57],"ill-posed":[58],"problem,":[59],"and":[60,72,150,160,227],"process":[62,146,168],"ultimately":[64],"data-hungry.":[65],"Existing":[66],"datasets":[68,78],"are":[69],"not":[70,199],"sufficient,":[71],"usage":[74],"of":[75,86,113,147,156,204,224,231],"2D":[76,110],"in-the-wild":[77],"often":[80],"susceptible":[81],"inadequate":[84],"precision":[85],"manual":[87],"annotations.":[88],"To":[89],"address":[90],"above":[92],"issues,":[93],"our":[94,225,232],"method":[95,226],"yields":[96],"substantial":[97],"improvements":[98],"two":[100],"domains.":[101],"First,":[102],"we":[103,129],"leverage":[104],"optical":[105],"flow":[106],"supervise":[108,187],"rendered":[111],"images":[112],"predicted":[114],"SMPL":[115],"models":[116],"learn":[118],"short-term":[119],"temporal":[120,125,133],"features.":[121],"Besides,":[122],"taking":[123],"long-term":[124],"consistency":[126],"into":[127],"account,":[128],"define":[130],"encoder":[134,142],"based":[135],"on":[136,169],"dilated":[138],"convolutional":[139],"network.":[140],"The":[141],"decomposes":[143],"shape":[149],"pose,":[151],"first":[152],"guarantees":[153],"invariance":[155],"body":[158,211],"shape,":[159],"then":[161],"simulates":[162],"more":[164,174],"reasonable":[165],"forward":[166],"kinematics":[167],"this":[170],"basis":[171],"achieve":[173],"accurate":[175],"pose":[176],"estimation.":[177],"In":[178],"addition,":[179],"an":[180],"adversarial":[181],"framework":[183],"applied":[185],"progress":[190],"coarse-grained":[193],"way.":[194],"We":[195,216],"show":[196],"HPOF":[198],"only":[200],"improves":[201],"accuracy":[203],"poses":[206],"but":[207],"ensures":[208],"realistic":[210],"structure":[212],"throughout":[213],"perform":[217],"extensive":[218],"experimentation":[219],"demonstrate":[221],"superiority":[223],"analyze":[228],"effectiveness":[230],"model,":[233],"surpassing":[234],"other":[235],"state-of-the-arts.":[236]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
