{"id":"https://openalex.org/W7155394154","doi":"https://doi.org/10.48550/arxiv.2604.20574","title":"Where are they looking in the operating room?","display_name":"Where are they looking in the operating room?","publication_year":2026,"publication_date":"2026-04-22","ids":{"openalex":"https://openalex.org/W7155394154","doi":"https://doi.org/10.48550/arxiv.2604.20574"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.20574","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.20574","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.20574","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134439879","display_name":"Keqi Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Keqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133046267","display_name":"S\u00e9raphin Baributsa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baributsa, S\u00e9raphin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116269235","display_name":"Lilien Schewski","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schewski, Lilien","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134445996","display_name":"Vinkle Srivastav","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Srivastav, Vinkle","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081252567","display_name":"Didier Mutter","orcid":"https://orcid.org/0000-0002-7559-3328"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mutter, Didier","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060499253","display_name":"Guido Beldi","orcid":"https://orcid.org/0000-0002-9914-3807"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Beldi, Guido","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080764037","display_name":"Sandra Keller","orcid":"https://orcid.org/0000-0003-3229-9003"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Keller, Sandra","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134437329","display_name":"Nicolas Padoy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Padoy, Nicolas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10916","display_name":"Surgical Simulation and Training","score":0.31869998574256897,"subfield":{"id":"https://openalex.org/subfields/2746","display_name":"Surgery"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10916","display_name":"Surgical Simulation and Training","score":0.31869998574256897,"subfield":{"id":"https://openalex.org/subfields/2746","display_name":"Surgery"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.23229999840259552,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.12729999423027039,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.8194000124931335},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6809999942779541},{"id":"https://openalex.org/keywords/gaze","display_name":"Gaze","score":0.6406000256538391},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.40400001406669617},{"id":"https://openalex.org/keywords/surgical-team","display_name":"Surgical team","score":0.328000009059906},{"id":"https://openalex.org/keywords/phase","display_name":"Phase (matter)","score":0.31220000982284546}],"concepts":[{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.8194000124931335},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6809999942779541},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6638000011444092},{"id":"https://openalex.org/C2779916870","wikidata":"https://www.wikidata.org/wiki/Q14467155","display_name":"Gaze","level":2,"score":0.6406000256538391},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4821999967098236},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.44699999690055847},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42969998717308044},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.40400001406669617},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35120001435279846},{"id":"https://openalex.org/C3018700120","wikidata":"https://www.wikidata.org/wiki/Q40821","display_name":"Surgical team","level":2,"score":0.328000009059906},{"id":"https://openalex.org/C44280652","wikidata":"https://www.wikidata.org/wiki/Q104837","display_name":"Phase (matter)","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.28119999170303345},{"id":"https://openalex.org/C3019611579","wikidata":"https://www.wikidata.org/wiki/Q6641956","display_name":"Surgical procedures","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C12269588","wikidata":"https://www.wikidata.org/wiki/Q132364","display_name":"Communications protocol","level":2,"score":0.26570001244544983},{"id":"https://openalex.org/C135981907","wikidata":"https://www.wikidata.org/wiki/Q188056","display_name":"Triangulation","level":2,"score":0.2533000111579895}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.20574","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.20574","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.20574","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.20574","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Purpose:":[0],"Gaze-following,":[1],"the":[2,36,60,65,83,88,96,166,178,234],"task":[3],"of":[4,62,200],"inferring":[5],"where":[6,44],"individuals":[7],"are":[8],"looking,":[9],"has":[10,31],"been":[11,33],"widely":[12],"studied":[13],"in":[14,19,35,51,82,154,218,233,241,254],"computer":[15],"vision,":[16],"advancing":[17],"research":[18,239],"visual":[20,45],"attention":[21,46],"modeling,":[22],"social":[23],"scene":[24],"understanding,":[25],"and":[26,68,79,94,101,121,131,163,180,206],"human-robot":[27],"interaction.":[28],"However,":[29],"gaze-following":[30,63,92,100,127,232],"never":[32],"explored":[34],"operating":[37],"room":[38],"(OR),":[39],"a":[40,102,126,136,151,155,169,237],"complex,":[41],"high-stakes":[42],"environment":[43],"plays":[47],"an":[48],"important":[49],"role":[50,116,130,204],"surgical":[52,66,77,118,209,242,251],"workflow":[53,252],"analysis.":[54],"In":[55],"this":[56],"work,":[57],"we":[58,109,134,149],"introduce":[59,231],"concept":[61],"to":[64,113,249],"domain,":[67],"demonstrate":[69,183],"its":[70,246],"great":[71,247],"potential":[72,248],"for":[73,145,202,208],"understanding":[74],"clinical":[75,115,203],"roles,":[76],"phases,":[78],"team":[80,104,122,146,219],"communications":[81],"OR.":[84],"Methods:":[85],"We":[86,230],"extend":[87,95],"4D-OR":[89,179],"dataset":[90,98],"with":[91,99],"annotations,":[93],"Team-OR":[97,181],"new":[103],"communication":[105,123,147,220],"activity":[106,171],"annotations.":[107],"Then,":[108],"propose":[110,135],"novel":[111,238],"approaches":[112],"address":[114],"prediction,":[117],"phase":[119,132,210],"recognition,":[120,133],"detection":[124,172],"using":[125],"model.":[128,173],"For":[129],"gaze":[137,142],"heatmap-based":[138],"approach":[139,186,196],"that":[140,158,184],"uses":[141],"predictions":[143],"solely;":[144],"detection,":[148,221],"train":[150],"spatial-temporal":[152],"model":[153],"self-supervised":[156],"way":[157],"encodes":[159],"gaze-based":[160],"clip":[161],"features,":[162],"then":[164],"feed":[165],"features":[167],"into":[168],"temporal":[170],"Results:":[174],"Experimental":[175],"results":[176],"on":[177,190],"datasets":[182],"our":[185,195],"achieves":[187],"state-of-the-art":[188],"performance":[189],"all":[191],"downstream":[192],"tasks.":[193],"Quantitatively,":[194],"obtains":[197],"F1":[198],"scores":[199],"0.92":[201],"prediction":[205],"0.95":[207],"recognition.":[211],"Furthermore,":[212],"it":[213],"significantly":[214],"outperforms":[215],"existing":[216],"baselines":[217],"improving":[222],"previous":[223],"best":[224],"performances":[225],"by":[226],"over":[227],"30%.":[228],"Conclusion:":[229],"OR":[235],"as":[236],"direction":[240],"data":[243],"science,":[244],"highlighting":[245],"advance":[250],"analysis":[253],"computer-assisted":[255],"interventions.":[256]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-24T00:00:00"}
