{"id":"https://openalex.org/W4409160016","doi":"https://doi.org/10.1145/3727984","title":"Multi-Person Pose Estimation with Feature Enhancement and Decoupling Based on Contrastive Learning","display_name":"Multi-Person Pose Estimation with Feature Enhancement and Decoupling Based on Contrastive Learning","publication_year":2025,"publication_date":"2025-04-04","ids":{"openalex":"https://openalex.org/W4409160016","doi":"https://doi.org/10.1145/3727984"},"language":"en","primary_location":{"id":"doi:10.1145/3727984","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3727984","pdf_url":null,"source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103097907","display_name":"Zhiyuan Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiyuan Liu","raw_affiliation_strings":["School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China","Beijing Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China","institution_ids":["https://openalex.org/I21193070"]},{"raw_affiliation_string":"Beijing Jiaotong University, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101696368","display_name":"Qi Zou","orcid":"https://orcid.org/0000-0002-8070-5267"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Zou","raw_affiliation_strings":["School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China","Beijing Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China","institution_ids":["https://openalex.org/I21193070"]},{"raw_affiliation_string":"Beijing Jiaotong University, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067613982","display_name":"Xixia Xu","orcid":"https://orcid.org/0000-0001-6305-475X"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210107198","display_name":"State Key Laboratory of Transducer Technology","ror":"https://ror.org/01qg56n75","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366","https://openalex.org/I19820366","https://openalex.org/I4210107198","https://openalex.org/I4210110458","https://openalex.org/I4210147322"]},{"id":"https://openalex.org/I4210147322","display_name":"Shanghai Institute of Microsystem and Information Technology","ror":"https://ror.org/04nytyj38","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210147322"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xixia Xu","raw_affiliation_strings":["Bionic Vision System Laboratory, State Key Laboratory of Transducer Technology, Shanghai Institute of Microsystem and Information Technology, Chinese Academy of Sciences, Shanghai, China","Chinese Academy of Sciences, China"],"affiliations":[{"raw_affiliation_string":"Bionic Vision System Laboratory, State Key Laboratory of Transducer Technology, Shanghai Institute of Microsystem and Information Technology, Chinese Academy of Sciences, Shanghai, China","institution_ids":["https://openalex.org/I4210107198","https://openalex.org/I4210147322"]},{"raw_affiliation_string":"Chinese Academy of Sciences, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076339674","display_name":"Yanting Pei","orcid":"https://orcid.org/0000-0003-2462-4777"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanting Pei","raw_affiliation_strings":["School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China","Beijing Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China","institution_ids":["https://openalex.org/I21193070"]},{"raw_affiliation_string":"Beijing Jiaotong University, China","institution_ids":["https://openalex.org/I21193070"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5103097907"],"corresponding_institution_ids":["https://openalex.org/I21193070"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.05230126,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"21","issue":"6","first_page":"1","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9109584093093872},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7066180109977722},{"id":"https://openalex.org/keywords/decoupling","display_name":"Decoupling (probability)","score":0.6706697940826416},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5998942255973816},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.5513765215873718},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.46557849645614624},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4313663840293884},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.4246971607208252},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41312819719314575},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.32218414545059204}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9109584093093872},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7066180109977722},{"id":"https://openalex.org/C205606062","wikidata":"https://www.wikidata.org/wiki/Q5249645","display_name":"Decoupling (probability)","level":2,"score":0.6706697940826416},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5998942255973816},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.5513765215873718},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.46557849645614624},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4313663840293884},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.4246971607208252},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41312819719314575},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32218414545059204},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3727984","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3727984","pdf_url":null,"source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1530404542","https://openalex.org/W1861492603","https://openalex.org/W2175012183","https://openalex.org/W2307770531","https://openalex.org/W2578797046","https://openalex.org/W2962773068","https://openalex.org/W2962820842","https://openalex.org/W2962954622","https://openalex.org/W2963150697","https://openalex.org/W2963402313","https://openalex.org/W2963781481","https://openalex.org/W2993728126","https://openalex.org/W3012573144","https://openalex.org/W3014641072","https://openalex.org/W3034399482","https://openalex.org/W3082133990","https://openalex.org/W3138516171","https://openalex.org/W3171398643","https://openalex.org/W3172013121","https://openalex.org/W3173964191","https://openalex.org/W3176892444","https://openalex.org/W3182545801","https://openalex.org/W3203572876","https://openalex.org/W3206609906","https://openalex.org/W4214508443","https://openalex.org/W4214573223","https://openalex.org/W4224992933","https://openalex.org/W4229890965","https://openalex.org/W4292787291","https://openalex.org/W4311727339","https://openalex.org/W4312632164","https://openalex.org/W4312925317","https://openalex.org/W4312967365","https://openalex.org/W4386065736","https://openalex.org/W4386075664","https://openalex.org/W4388192390","https://openalex.org/W4390873613","https://openalex.org/W4400786028"],"related_works":["https://openalex.org/W4313561376","https://openalex.org/W3103825105","https://openalex.org/W3027880158","https://openalex.org/W3207533102","https://openalex.org/W2905271011","https://openalex.org/W4280540140","https://openalex.org/W3164948662","https://openalex.org/W4289536128","https://openalex.org/W3153597579","https://openalex.org/W4298151006"],"abstract_inverted_index":{"Most":[0],"methods":[1],"of":[2,68,80],"multi-person":[3],"pose":[4],"estimation":[5],"(MPPE)":[6],"treat":[7],"the":[8,58,181],"human":[9,46],"detection":[10,47],"and":[11,48,66,70,83,106,117,126,140,149,154,163,170,189],"keypoint":[12,49,128],"localization":[13,129],"separately.":[14],"They":[15],"need":[16],"additional":[17,103],"supervision":[18,105],"like":[19,27,109],"instance":[20,64],"bounding":[21],"boxes,":[22],"or":[23,30],"complex":[24],"hand-crafted":[25],"processes":[26],"RoI":[28],"cropping":[29],"grouping.":[31],"In":[32],"this":[33],"article,":[34],"we":[35,73],"propose":[36],"a":[37,89,95],"novel":[38],"one-stage":[39,61],"MPPE":[40,101],"method,":[41],"named":[42],"COPE,":[43],"which":[44],"unifies":[45],"regression":[50],"into":[51],"an":[52],"end-to-end":[53],"learnable":[54],"framework.":[55],"To":[56],"handle":[57,123],"challenges":[59],"plague":[60],"MPPE,":[62],"i.e.,":[63],"overlapping":[65],"misalignment":[67],"local":[69],"global":[71],"context,":[72],"design":[74],"contrastive":[75,115],"constraints":[76,116],"at":[77],"two":[78],"levels":[79],"semantic":[81],"granularity":[82],"feature":[84],"sampling":[85,118],"strategies.":[86],"Based":[87],"on":[88,143,161,180],"whole-process":[90],"differentiable":[91],"pipeline,":[92],"COPE":[93,120,157,175],"establishes":[94],"simple":[96],"yet":[97],"effective":[98],"framework":[99],"for":[100],"without":[102],"instance-level":[104],"resource-intensive":[107],"modules":[108],"transformer.":[110],"Benefit":[111],"from":[112],"specially":[113],"designed":[114],"strategies,":[119],"can":[121],"better":[122],"occluded":[124,155],"scenes":[125],"correct":[127],"errors.":[130],"Extensive":[131],"experiments":[132],"demonstrate":[133],"COPE\u2019s":[134],"superiority.":[135],"It":[136],"attains":[137],"71.3":[138],"AP":[139,169,188],"18.0":[141],"FPS":[142],"COCO":[144],"val2017,":[145],"effectively":[146],"balancing":[147],"accuracy":[148],"speed.":[150],"Particularly":[151],"in":[152],"crowded":[153],"scenarios,":[156],"achieves":[158],"state-of-the-art":[159],"performance":[160,179],"CrowdPose":[162],"OCHuman,":[164],"surpassing":[165],"CID":[166],"by":[167,186,191],"0.6":[168],"1.7":[171],"AP,":[172],"respectively.":[173],"Furthermore,":[174],"strongly":[176],"improves":[177],"generalization":[178],"Human-Art":[182],"benchmark,":[183],"outperforming":[184],"ED-Pose":[185],"6.7":[187],"ClickPose":[190],"3.7":[192],"AP.":[193]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
