{"id":"https://openalex.org/W4392903368","doi":"https://doi.org/10.1109/icassp48485.2024.10448008","title":"Efficient Posenet with Coarse to Fine Transformer","display_name":"Efficient Posenet with Coarse to Fine Transformer","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392903368","doi":"https://doi.org/10.1109/icassp48485.2024.10448008"},"language":"en","primary_location":{"id":"doi:10.1109/icassp48485.2024.10448008","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10448008","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100367937","display_name":"Shaohua Li","orcid":"https://orcid.org/0000-0001-7115-5809"},"institutions":[{"id":"https://openalex.org/I1328775524","display_name":"Zhejiang Sci-Tech University","ror":"https://ror.org/03893we55","country_code":"CN","type":"education","lineage":["https://openalex.org/I1328775524"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shaohua Li","raw_affiliation_strings":["Zhejiang Sci-Tech University,School of Computer Science and Technology,Hangzhou,China","School of Computer Science and Technology, Zhejiang Sci-Tech University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang Sci-Tech University,School of Computer Science and Technology,Hangzhou,China","institution_ids":["https://openalex.org/I1328775524"]},{"raw_affiliation_string":"School of Computer Science and Technology, Zhejiang Sci-Tech University, Hangzhou, China","institution_ids":["https://openalex.org/I1328775524"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012637690","display_name":"Haixiang Zhang","orcid":"https://orcid.org/0009-0004-5802-1645"},"institutions":[{"id":"https://openalex.org/I1328775524","display_name":"Zhejiang Sci-Tech University","ror":"https://ror.org/03893we55","country_code":"CN","type":"education","lineage":["https://openalex.org/I1328775524"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haixiang Zhang","raw_affiliation_strings":["Zhejiang Sci-Tech University,School of Computer Science and Technology,Hangzhou,China","School of Computer Science and Technology, Zhejiang Sci-Tech University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang Sci-Tech University,School of Computer Science and Technology,Hangzhou,China","institution_ids":["https://openalex.org/I1328775524"]},{"raw_affiliation_string":"School of Computer Science and Technology, Zhejiang Sci-Tech University, Hangzhou, China","institution_ids":["https://openalex.org/I1328775524"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101196349","display_name":"Hanjie Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I1328775524","display_name":"Zhejiang Sci-Tech University","ror":"https://ror.org/03893we55","country_code":"CN","type":"education","lineage":["https://openalex.org/I1328775524"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hanjie Ma","raw_affiliation_strings":["Zhejiang Sci-Tech University,School of Computer Science and Technology,Hangzhou,China","School of Computer Science and Technology, Zhejiang Sci-Tech University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang Sci-Tech University,School of Computer Science and Technology,Hangzhou,China","institution_ids":["https://openalex.org/I1328775524"]},{"raw_affiliation_string":"School of Computer Science and Technology, Zhejiang Sci-Tech University, Hangzhou, China","institution_ids":["https://openalex.org/I1328775524"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052017667","display_name":"Jie Feng","orcid":"https://orcid.org/0000-0001-9496-0034"},"institutions":[{"id":"https://openalex.org/I1328775524","display_name":"Zhejiang Sci-Tech University","ror":"https://ror.org/03893we55","country_code":"CN","type":"education","lineage":["https://openalex.org/I1328775524"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Feng","raw_affiliation_strings":["Zhejiang Sci-Tech University,School of Computer Science and Technology,Hangzhou,China","School of Computer Science and Technology, Zhejiang Sci-Tech University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang Sci-Tech University,School of Computer Science and Technology,Hangzhou,China","institution_ids":["https://openalex.org/I1328775524"]},{"raw_affiliation_string":"School of Computer Science and Technology, Zhejiang Sci-Tech University, Hangzhou, China","institution_ids":["https://openalex.org/I1328775524"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002822938","display_name":"Mingfeng Jiang","orcid":"https://orcid.org/0000-0003-3013-4790"},"institutions":[{"id":"https://openalex.org/I1328775524","display_name":"Zhejiang Sci-Tech University","ror":"https://ror.org/03893we55","country_code":"CN","type":"education","lineage":["https://openalex.org/I1328775524"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingfeng Jiang","raw_affiliation_strings":["Zhejiang Sci-Tech University,School of Computer Science and Technology,Hangzhou,China","School of Computer Science and Technology, Zhejiang Sci-Tech University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang Sci-Tech University,School of Computer Science and Technology,Hangzhou,China","institution_ids":["https://openalex.org/I1328775524"]},{"raw_affiliation_string":"School of Computer Science and Technology, Zhejiang Sci-Tech University, Hangzhou, China","institution_ids":["https://openalex.org/I1328775524"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100367937"],"corresponding_institution_ids":["https://openalex.org/I1328775524"],"apc_list":null,"apc_paid":null,"fwci":0.265,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.4695507,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"5100","last_page":"5104"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12740","display_name":"Gait Recognition and Analysis","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.9243493676185608},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7135517001152039},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6412913799285889},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6070010662078857},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.5496911406517029},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5008621215820312},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.37615707516670227},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36323320865631104},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.20291587710380554},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.13018646836280823},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.07973915338516235},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.07127350568771362}],"concepts":[{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.9243493676185608},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7135517001152039},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6412913799285889},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6070010662078857},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.5496911406517029},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5008621215820312},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.37615707516670227},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36323320865631104},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.20291587710380554},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.13018646836280823},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.07973915338516235},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.07127350568771362},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp48485.2024.10448008","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10448008","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.6100000143051147,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W2113325037","https://openalex.org/W2307770531","https://openalex.org/W2754854484","https://openalex.org/W2896457183","https://openalex.org/W2916798096","https://openalex.org/W2963402313","https://openalex.org/W2964221239","https://openalex.org/W2991479034","https://openalex.org/W3005927085","https://openalex.org/W3034999214","https://openalex.org/W3121523901","https://openalex.org/W3139887931","https://openalex.org/W3158818292","https://openalex.org/W3168124404","https://openalex.org/W3171398643","https://openalex.org/W3176892444","https://openalex.org/W3203925315","https://openalex.org/W3213792864","https://openalex.org/W4213332096","https://openalex.org/W4214508443","https://openalex.org/W4226549668","https://openalex.org/W4229005866","https://openalex.org/W4289047567","https://openalex.org/W4312290555","https://openalex.org/W4312614783","https://openalex.org/W4312677967","https://openalex.org/W4313349624","https://openalex.org/W4381252798","https://openalex.org/W4382239283","https://openalex.org/W6755207826","https://openalex.org/W6757733370","https://openalex.org/W6794073987","https://openalex.org/W6796494063","https://openalex.org/W6803650990","https://openalex.org/W6811272755","https://openalex.org/W6811340617"],"related_works":["https://openalex.org/W4388335561","https://openalex.org/W2970530566","https://openalex.org/W4288261899","https://openalex.org/W4307309205","https://openalex.org/W2967478618","https://openalex.org/W4385009901","https://openalex.org/W4385572700","https://openalex.org/W2997152889","https://openalex.org/W4387768015","https://openalex.org/W4304700937"],"abstract_inverted_index":{"In":[0],"recent":[1],"years,":[2],"Transformers":[3],"have":[4],"been":[5],"widely":[6],"applied":[7],"in":[8,24],"human":[9,47,66],"pose":[10,48],"estimation":[11],"by":[12,138],"converting":[13],"image":[14],"features":[15,54,113],"into":[16,82],"token":[17,74,79,92,99,102,124],"forms":[18],"as":[19,35],"inputs.":[20],"However,":[21],"redundant":[22],"information":[23],"images":[25],"burdens":[26],"the":[27,65,88,117],"network":[28,109],"and":[29,62,77,100],"can":[30],"even":[31],"negatively":[32],"impact":[33],"training":[34],"noise.":[36],"Thus,":[37],"we":[38],"propose":[39],"a":[40,56,69,83,106],"coarse-to-fine":[41],"Transformer":[42],"called":[43],"CFPose":[44,134],"for":[45,120,130],"efficient":[46],"estimation.":[49],"We":[50],"first":[51],"extract":[52],"visual":[53],"through":[55],"backbone":[57],"network,":[58],"then":[59],"remove":[60],"redundancy":[61],"coarsely":[63],"crop":[64],"figure":[67],"via":[68],"coarse-grained":[70],"decision":[71,108],"network.":[72],"Coarse-Grained":[73],"(CG":[75],"token)":[76,104],"keypoint":[78,91,98,123,131],"are":[80,114,125],"fed":[81],"two-stage":[84],"Transformer,":[85],"where":[86],"after":[87],"CG":[89],"encoder,":[90],"sufficiently":[93],"incorporate":[94],"coarse":[95],"features.":[96],"Only":[97],"Fine-Grained":[101],"(FG":[103],"from":[105],"fine-grained":[107],"that":[110],"further":[111],"segments":[112],"input":[115],"to":[116,127,143],"FG":[118],"encoder":[119],"training.":[121],"Finally,":[122],"mapped":[126],"2D":[128],"heatmaps":[129],"prediction.":[132],"Impressively,":[133],"reduces":[135],"computational":[136],"complexity":[137],"43%":[139],"while":[140],"improving":[141],"accuracy":[142],"76.2%":[144],"on":[145,152],"COCO.":[146],"It":[147],"also":[148],"achieves":[149],"competitive":[150],"results":[151],"MPII.":[153]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2025-10-10T00:00:00"}
