{"id":"https://openalex.org/W4390047164","doi":"https://doi.org/10.48550/arxiv.2312.12042","title":"Pose2Gaze: Eye-body Coordination during Daily Activities for Gaze Prediction from Full-body Poses","display_name":"Pose2Gaze: Eye-body Coordination during Daily Activities for Gaze Prediction from Full-body Poses","publication_year":2023,"publication_date":"2023-12-19","ids":{"openalex":"https://openalex.org/W4390047164","doi":"https://doi.org/10.48550/arxiv.2312.12042"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2312.12042","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.12042","pdf_url":"https://arxiv.org/pdf/2312.12042","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2312.12042","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101425139","display_name":"Zhiming Hu","orcid":"https://orcid.org/0000-0002-2422-8099"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Hu, Zhiming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101985461","display_name":"Jiahui Xu","orcid":"https://orcid.org/0000-0001-9033-8715"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Jiahui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052810943","display_name":"Syn Schmitt","orcid":"https://orcid.org/0000-0002-7768-8961"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schmitt, Syn","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5073661463","display_name":"Andreas Bulling","orcid":"https://orcid.org/0000-0001-6317-7303"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bulling, Andreas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101425139"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9801999926567078,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9560999870300293,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/gaze","display_name":"Gaze","score":0.7941281199455261},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7278647422790527},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6613154411315918},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6591528058052063},{"id":"https://openalex.org/keywords/eye-movement","display_name":"Eye movement","score":0.5933352708816528},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5454933047294617},{"id":"https://openalex.org/keywords/eye\u2013hand-coordination","display_name":"Eye\u2013hand coordination","score":0.5298086404800415},{"id":"https://openalex.org/keywords/eye-tracking","display_name":"Eye tracking","score":0.5022857189178467},{"id":"https://openalex.org/keywords/virtual-reality","display_name":"Virtual reality","score":0.45477908849716187},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.426638126373291}],"concepts":[{"id":"https://openalex.org/C2779916870","wikidata":"https://www.wikidata.org/wiki/Q14467155","display_name":"Gaze","level":2,"score":0.7941281199455261},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7278647422790527},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6613154411315918},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6591528058052063},{"id":"https://openalex.org/C153050134","wikidata":"https://www.wikidata.org/wiki/Q760256","display_name":"Eye movement","level":2,"score":0.5933352708816528},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5454933047294617},{"id":"https://openalex.org/C122434488","wikidata":"https://www.wikidata.org/wiki/Q565578","display_name":"Eye\u2013hand coordination","level":2,"score":0.5298086404800415},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.5022857189178467},{"id":"https://openalex.org/C194969405","wikidata":"https://www.wikidata.org/wiki/Q170519","display_name":"Virtual reality","level":2,"score":0.45477908849716187},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.426638126373291},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2312.12042","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.12042","pdf_url":"https://arxiv.org/pdf/2312.12042","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2312.12042","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2312.12042","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2312.12042","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2312.12042","pdf_url":"https://arxiv.org/pdf/2312.12042","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5543094940","display_name":null,"funder_award_id":"EXC 2075 -390740016","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"},{"id":"https://openalex.org/G7249683039","display_name":null,"funder_award_id":"EXC 2075","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"},{"id":"https://openalex.org/G8784604414","display_name":null,"funder_award_id":"390740016","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4390047164.pdf","grobid_xml":"https://content.openalex.org/works/W4390047164.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4384434815","https://openalex.org/W2161294397","https://openalex.org/W2012644758","https://openalex.org/W1701036363","https://openalex.org/W2958385752","https://openalex.org/W1561131412","https://openalex.org/W1981014703","https://openalex.org/W4206950173","https://openalex.org/W2186236678","https://openalex.org/W2113629050"],"abstract_inverted_index":{"Human":[0],"eye":[1,89,164,175],"gaze":[2,29,90,107,176,251],"plays":[3],"a":[4,47,105,127,134,139,158,247],"significant":[5,234],"role":[6],"in":[7,53,66,82,98,206,221,238],"many":[8],"virtual":[9],"and":[10,31,38,56,76,87,103,138,151,155,181,202,244],"augmented":[11],"reality":[12],"(VR/AR)":[13],"applications,":[14],"such":[15],"as":[16,71,73],"gaze-contingent":[17],"rendering,":[18],"gaze-based":[19],"interaction,":[20],"or":[21],"eye-based":[22,227],"activity":[23,228],"recognition.":[24,229],"However,":[25],"prior":[26,219],"works":[27],"on":[28,61,194,197,200,204],"analysis":[30,49],"prediction":[32],"have":[33],"only":[34,177],"explored":[35],"eye-head":[36],"coordination":[37,52,130,240],"were":[39],"limited":[40],"to":[41,145,162],"human-object":[42,55,83],"interactions.":[43],"We":[44,79,166,211],"first":[45],"report":[46],"comprehensive":[48],"of":[50,192,226],"eye-body":[51,129,239],"various":[54],"human-human":[57,99],"interaction":[58,117],"activities":[59,243],"based":[60],"four":[62],"public":[63],"datasets":[64],"collected":[65],"real-world":[67],"(MoGaze),":[68],"VR":[69],"(ADT),":[70],"well":[72],"AR":[74],"(GIMO":[75],"EgoBody)":[77],"environments.":[78],"show":[80,182,213],"that":[81,132,173,183,214],"interactions,":[84,100],"e.g.":[85,101],"pick":[86],"place,":[88],"exhibits":[91],"strong":[92],"correlations":[93],"with":[94,111,170,188],"full-body":[95,152],"motion":[96],"while":[97],"chat":[102],"teach,":[104],"person's":[106],"direction":[108,150,249],"is":[109],"correlated":[110],"the":[112,116,222,233],"body":[113],"orientation":[114],"towards":[115],"partner.":[118],"Informed":[119],"by":[120],"these":[121,186],"analyses":[122],"we":[123],"then":[124,156],"present":[125],"Pose2Gaze,":[126],"novel":[128],"model":[131],"uses":[133,157],"convolutional":[135,142,159],"neural":[136,143,160],"network":[137,144,161],"spatio-temporal":[140],"graph":[141],"extract":[146],"features":[147],"from":[148,178],"head":[149,179],"poses,":[153],"respectively,":[154],"predict":[163,174],"gaze.":[165],"compare":[167],"our":[168,215],"method":[169,216],"state-of-the-art":[171],"methods":[172,220],"movements":[180],"Pose2Gaze":[184],"outperforms":[185,218],"baselines":[187],"an":[189],"average":[190],"improvement":[191],"24.0%":[193],"MoGaze,":[195],"10.1%":[196],"ADT,":[198],"21.3%":[199],"GIMO,":[201],"28.6%":[203],"EgoBody":[205],"mean":[207],"angular":[208],"error,":[209],"respectively.":[210],"also":[212],"significantly":[217],"sample":[223],"downstream":[224],"task":[225],"These":[230],"results":[231],"underline":[232],"information":[235],"content":[236],"available":[237],"during":[241],"daily":[242],"open":[245],"up":[246],"new":[248],"for":[250],"prediction.":[252]},"counts_by_year":[],"updated_date":"2026-05-02T08:42:23.175194","created_date":"2023-12-22T00:00:00"}
