{"id":"https://openalex.org/W3201881652","doi":"https://doi.org/10.1145/3467707.3467729","title":"A New Head Pose Estimation Method Using Vision Transformer Model","display_name":"A New Head Pose Estimation Method Using Vision Transformer Model","publication_year":2021,"publication_date":"2021-04-23","ids":{"openalex":"https://openalex.org/W3201881652","doi":"https://doi.org/10.1145/3467707.3467729","mag":"3201881652"},"language":"en","primary_location":{"id":"doi:10.1145/3467707.3467729","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3467707.3467729","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 7th International Conference on Computing and Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086015675","display_name":"Xufeng Ling","orcid":"https://orcid.org/0000-0001-5217-3614"},"institutions":[{"id":"https://openalex.org/I21945476","display_name":"Shanghai Normal University","ror":"https://ror.org/01cxqmw89","country_code":"CN","type":"education","lineage":["https://openalex.org/I21945476"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xufeng Ling","raw_affiliation_strings":["Shanghai Normal University Tianhua College, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Normal University Tianhua College, China","institution_ids":["https://openalex.org/I21945476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100391437","display_name":"Dong Wang","orcid":"https://orcid.org/0000-0001-9457-263X"},"institutions":[{"id":"https://openalex.org/I21945476","display_name":"Shanghai Normal University","ror":"https://ror.org/01cxqmw89","country_code":"CN","type":"education","lineage":["https://openalex.org/I21945476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dong Wang","raw_affiliation_strings":["Shanghai Normal University Tianhua College, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Normal University Tianhua College, China","institution_ids":["https://openalex.org/I21945476"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100404947","display_name":"Jie Yang","orcid":"https://orcid.org/0000-0003-4801-7162"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Yang","raw_affiliation_strings":["Shanghai Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiaotong University, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5086015675"],"corresponding_institution_ids":["https://openalex.org/I21945476"],"apc_list":null,"apc_paid":null,"fwci":0.2882,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.5603268,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"154","last_page":"159"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9803000092506409,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.682003378868103},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.6487921476364136},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6118558645248413},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.610663652420044},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6106359958648682},{"id":"https://openalex.org/keywords/3d-pose-estimation","display_name":"3D pose estimation","score":0.47212085127830505},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.16356593370437622},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.08167219161987305}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.682003378868103},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.6487921476364136},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6118558645248413},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.610663652420044},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6106359958648682},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.47212085127830505},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.16356593370437622},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.08167219161987305},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3467707.3467729","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3467707.3467729","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 7th International Conference on Computing and Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W1991544872","https://openalex.org/W2097649661","https://openalex.org/W3094502228","https://openalex.org/W3119997354","https://openalex.org/W3187418919","https://openalex.org/W4240153047","https://openalex.org/W4297792979","https://openalex.org/W4324085337"],"related_works":["https://openalex.org/W4299360450","https://openalex.org/W2567319754","https://openalex.org/W2064877078","https://openalex.org/W2952510816","https://openalex.org/W2154613448","https://openalex.org/W4306804934","https://openalex.org/W1968716783","https://openalex.org/W2963043350","https://openalex.org/W2085100591","https://openalex.org/W2004095265"],"abstract_inverted_index":{"In":[0],"this":[1,61],"paper,":[2],"a":[3,33,42],"self-attention-based":[4],"Vision":[5],"Transformer":[6],"(VIT)":[7],"method":[8],"is":[9,22,30,39,87,99],"introduced":[10],"into":[11,24],"estimate":[12,70],"human":[13],"head":[14,19,104,123],"pose":[15,20,105,124],"parameters.":[16,72],"Firstly,":[17],"the":[18,36,49,57,66,71,80,90,96,103],"image":[21,28,38],"divided":[23],"32X32":[25],"patches,":[26],"each":[27],"patch":[29],"regarded":[31,55],"as":[32,41,56,79],"word,":[34],"and":[35,82,92,118],"whole":[37],"treated":[40],"paragraph":[43],"composed":[44],"of":[45,60],"n":[46],"words":[47],"by":[48],"VIT.":[50],"Image":[51],"recognition":[52,59],"can":[53],"be":[54],"semantic":[58],"paragraph.":[62],"Next,":[63],"we":[64,74],"redesign":[65],"regression":[67],"VIT":[68,86,98,114],"to":[69,101],"Then":[73],"select":[75],"Head":[76],"Pose":[77],"Database":[78],"training":[81],"validation":[83],"dataset.":[84,94],"The":[85],"trained":[88,97],"on":[89,107],"enhanced":[91],"normalized":[93],"Finally,":[95],"used":[100],"regress":[102],"parameters":[106],"testing":[108],"samples.":[109],"Experimental":[110],"results":[111],"show":[112],"that":[113],"has":[115],"high":[116],"accuracy":[117],"good":[119],"generalization":[120],"ability":[121],"for":[122],"estimation.":[125]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
