{"id":"https://openalex.org/W4416256040","doi":"https://doi.org/10.48550/arxiv.2509.19574","title":"Mouse-Guided Gaze: Semi-Supervised Learning of Intention-Aware Representations for Reading Detection","display_name":"Mouse-Guided Gaze: Semi-Supervised Learning of Intention-Aware Representations for Reading Detection","publication_year":2025,"publication_date":"2025-09-23","ids":{"openalex":"https://openalex.org/W4416256040","doi":"https://doi.org/10.48550/arxiv.2509.19574"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2509.19574","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.19574","pdf_url":"https://arxiv.org/pdf/2509.19574","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2509.19574","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022925970","display_name":"Seongsil Heo","orcid":"https://orcid.org/0000-0002-7785-8473"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Heo, Seongsil","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5075120422","display_name":"Roberto Manduchi","orcid":"https://orcid.org/0000-0003-2640-302X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manduchi, Roberto","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.9550999999046326,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.9550999999046326,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10789","display_name":"Interactive and Immersive Displays","score":0.013000000268220901,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10914","display_name":"Tactile and Sensory Interactions","score":0.00570000009611249,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/gaze","display_name":"Gaze","score":0.7028999924659729},{"id":"https://openalex.org/keywords/viewport","display_name":"Viewport","score":0.6406999826431274},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6004999876022339},{"id":"https://openalex.org/keywords/reading","display_name":"Reading (process)","score":0.5827000141143799},{"id":"https://openalex.org/keywords/eye-tracking","display_name":"Eye tracking","score":0.4661000072956085},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.3127000033855438}],"concepts":[{"id":"https://openalex.org/C2779916870","wikidata":"https://www.wikidata.org/wiki/Q14467155","display_name":"Gaze","level":2,"score":0.7028999924659729},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6848999857902527},{"id":"https://openalex.org/C2778090530","wikidata":"https://www.wikidata.org/wiki/Q2523931","display_name":"Viewport","level":2,"score":0.6406999826431274},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6004999876022339},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5911999940872192},{"id":"https://openalex.org/C554936623","wikidata":"https://www.wikidata.org/wiki/Q199657","display_name":"Reading (process)","level":2,"score":0.5827000141143799},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.4661000072956085},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35350000858306885},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3127000033855438},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.30660000443458557},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.2854999899864197},{"id":"https://openalex.org/C4144372","wikidata":"https://www.wikidata.org/wiki/Q675287","display_name":"Magnification","level":2,"score":0.2809000015258789},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.26669999957084656},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.2606000006198883},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.25870001316070557},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2581000030040741},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.25589999556541443},{"id":"https://openalex.org/C198352243","wikidata":"https://www.wikidata.org/wiki/Q37105","display_name":"Line (geometry)","level":2,"score":0.25589999556541443}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2509.19574","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.19574","pdf_url":"https://arxiv.org/pdf/2509.19574","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2509.19574","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.19574","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2509.19574","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.19574","pdf_url":"https://arxiv.org/pdf/2509.19574","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Understanding":[0],"user":[1],"intent":[2],"during":[3],"magnified":[4,77],"reading":[5,28,63],"is":[6,49],"critical":[7],"for":[8,127,134],"accessible":[9],"interface":[10],"design.":[11],"Yet":[12],"magnification":[13],"collapses":[14],"visual":[15],"context":[16],"and":[17,26,79,94,98],"forces":[18],"continual":[19],"viewport":[20,78],"dragging,":[21],"producing":[22],"fragmented,":[23],"noisy":[24],"gaze":[25,38,74],"obscuring":[27],"intent.":[29],"We":[30],"present":[31],"a":[32,80],"semi-supervised":[33,108],"framework":[34],"that":[35],"learns":[36],"intention-aware":[37],"representations":[39],"by":[40],"leveraging":[41],"mouse":[42,54],"trajectories":[43],"as":[44],"weak":[45],"supervision.":[46],"The":[47],"model":[48,72],"first":[50],"pretrained":[51],"to":[52,61,84,112],"predict":[53],"velocity":[55],"from":[56],"unlabeled":[57],"gaze,":[58],"then":[59],"fine-tuned":[60],"classify":[62],"versus":[64],"scanning.":[65],"To":[66],"address":[67],"magnification-induced":[68],"distortions,":[69],"we":[70],"jointly":[71],"raw":[73],"within":[75],"the":[76,85,122,132],"compensated":[81],"view":[82],"remapped":[83],"original":[86],"screen,":[87],"which":[88],"restores":[89],"spatial":[90],"continuity":[91],"across":[92],"lines":[93],"paragraphs.":[95],"Across":[96],"text":[97],"webpage":[99],"datasets,":[100],"our":[101],"approach":[102],"consistently":[103],"outperforms":[104],"supervised":[105],"baselines,":[106],"with":[107],"pretraining":[109,126],"yielding":[110],"up":[111],"7.5%":[113],"F1":[114],"improvement":[115],"in":[116],"challenging":[117],"settings.":[118],"These":[119],"findings":[120],"highlight":[121],"value":[123],"of":[124],"behavior-driven":[125],"robust,":[128],"gaze-only":[129],"interaction,":[130],"paving":[131],"way":[133],"adaptive,":[135],"hands-free":[136],"accessibility":[137],"tools.":[138]},"counts_by_year":[],"updated_date":"2026-07-01T08:55:40.977307","created_date":"2025-10-10T00:00:00"}
