{"id":"https://openalex.org/W2092760152","doi":"https://doi.org/10.1145/2535948.2535953","title":"Mutual disambiguation of eye gaze and speech for sight translation and reading","display_name":"Mutual disambiguation of eye gaze and speech for sight translation and reading","publication_year":2013,"publication_date":"2013-11-26","ids":{"openalex":"https://openalex.org/W2092760152","doi":"https://doi.org/10.1145/2535948.2535953","mag":"2092760152"},"language":"en","primary_location":{"id":"doi:10.1145/2535948.2535953","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2535948.2535953","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 6th workshop on Eye gaze in intelligent human machine interaction: gaze in multimodal interaction","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005043203","display_name":"Rucha Kulkarni","orcid":"https://orcid.org/0000-0002-7636-6856"},"institutions":[{"id":"https://openalex.org/I162827531","display_name":"Indian Institute of Technology Bombay","ror":"https://ror.org/02qyf5152","country_code":"IN","type":"education","lineage":["https://openalex.org/I162827531"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Rucha Kulkarni","raw_affiliation_strings":["Indian Institute of Technology, Bombay, Mumbai, India","Indian Institute of Technology-Bombay, Mumbai, India#TAB#"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology, Bombay, Mumbai, India","institution_ids":["https://openalex.org/I162827531"]},{"raw_affiliation_string":"Indian Institute of Technology-Bombay, Mumbai, India#TAB#","institution_ids":["https://openalex.org/I162827531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065415798","display_name":"Kritika Jain","orcid":null},"institutions":[{"id":"https://openalex.org/I162827531","display_name":"Indian Institute of Technology Bombay","ror":"https://ror.org/02qyf5152","country_code":"IN","type":"education","lineage":["https://openalex.org/I162827531"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Kritika Jain","raw_affiliation_strings":["Indian Institute of Technology, Bombay, Mumbai, India","Indian Institute of Technology-Bombay, Mumbai, India#TAB#"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology, Bombay, Mumbai, India","institution_ids":["https://openalex.org/I162827531"]},{"raw_affiliation_string":"Indian Institute of Technology-Bombay, Mumbai, India#TAB#","institution_ids":["https://openalex.org/I162827531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014894459","display_name":"Himanshu Bansal","orcid":"https://orcid.org/0000-0002-9487-3472"},"institutions":[{"id":"https://openalex.org/I1317621060","display_name":"Indian Institute of Technology Guwahati","ror":"https://ror.org/0022nd079","country_code":"IN","type":"education","lineage":["https://openalex.org/I1317621060"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Himanshu Bansal","raw_affiliation_strings":["Indian Institute of Technology, Guwahati, Guwahati, India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology, Guwahati, Guwahati, India","institution_ids":["https://openalex.org/I1317621060"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111475783","display_name":"Srinivas Bangalore","orcid":null},"institutions":[{"id":"https://openalex.org/I1283103587","display_name":"AT&T (United States)","ror":"https://ror.org/02bbd5539","country_code":"US","type":"company","lineage":["https://openalex.org/I1283103587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Srinivas Bangalore","raw_affiliation_strings":["AT&amp;T Research, New Jearsey, USA"],"affiliations":[{"raw_affiliation_string":"AT&amp;T Research, New Jearsey, USA","institution_ids":["https://openalex.org/I1283103587"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085495324","display_name":"Micha\u00ebl Carl","orcid":"https://orcid.org/0000-0002-2815-0292"},"institutions":[{"id":"https://openalex.org/I180519160","display_name":"Copenhagen Business School","ror":"https://ror.org/04sppb023","country_code":"DK","type":"education","lineage":["https://openalex.org/I180519160"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Michael Carl","raw_affiliation_strings":["Copenhagen Business School, Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"Copenhagen Business School, Copenhagen, Denmark","institution_ids":["https://openalex.org/I180519160"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5005043203"],"corresponding_institution_ids":["https://openalex.org/I162827531"],"apc_list":null,"apc_paid":null,"fwci":0.6356,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.72632998,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"35","last_page":"40"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9589999914169312,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.824608564376831},{"id":"https://openalex.org/keywords/gaze","display_name":"Gaze","score":0.6958140134811401},{"id":"https://openalex.org/keywords/eye-tracking","display_name":"Eye tracking","score":0.6097522377967834},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.580162525177002},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5446516871452332},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5099495649337769},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5032255053520203},{"id":"https://openalex.org/keywords/usable","display_name":"USable","score":0.4662892520427704},{"id":"https://openalex.org/keywords/speech-translation","display_name":"Speech translation","score":0.46133530139923096},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.4458676278591156},{"id":"https://openalex.org/keywords/sight","display_name":"Sight","score":0.4291546046733856},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4261529743671417},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.08381730318069458}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.824608564376831},{"id":"https://openalex.org/C2779916870","wikidata":"https://www.wikidata.org/wiki/Q14467155","display_name":"Gaze","level":2,"score":0.6958140134811401},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.6097522377967834},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.580162525177002},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5446516871452332},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5099495649337769},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5032255053520203},{"id":"https://openalex.org/C2780615836","wikidata":"https://www.wikidata.org/wiki/Q2471869","display_name":"USable","level":2,"score":0.4662892520427704},{"id":"https://openalex.org/C2780366754","wikidata":"https://www.wikidata.org/wiki/Q7494857","display_name":"Speech translation","level":3,"score":0.46133530139923096},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.4458676278591156},{"id":"https://openalex.org/C1517167","wikidata":"https://www.wikidata.org/wiki/Q1134322","display_name":"Sight","level":2,"score":0.4291546046733856},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4261529743671417},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.08381730318069458},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/2535948.2535953","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2535948.2535953","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 6th workshop on Eye gaze in intelligent human machine interaction: gaze in multimodal interaction","raw_type":"proceedings-article"},{"id":"pmh:oai:research-api.cbs.dk:openaire_cris_publications/29a0b0e0-cbac-4a94-8f9a-2d5ac63cc1a8","is_oa":false,"landing_page_url":"https://research.cbs.dk/en/publications/29a0b0e0-cbac-4a94-8f9a-2d5ac63cc1a8","pdf_url":null,"source":{"id":"https://openalex.org/S4306401458","display_name":"CBS Research Portal (Copenhagen Business School)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I180519160","host_organization_name":"Copenhagen Business School","host_organization_lineage":["https://openalex.org/I180519160"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Kulkarni , R, Jain, K, Bansal, H, Bangalore, S & Carl, M 2013, 'Mutual Disambiguation of Eye Gaze and Speech for Sight Translation and Reading', Paper presented at 10th International Conference on Natural Language Processing, Noida, India, 18/12/2013 - 20/12/2013.","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:research-api.cbs.dk:openaire_cris_publications/35aaee7f-36c5-4d3c-a758-e75db7245332","is_oa":false,"landing_page_url":"https://research.cbs.dk/en/publications/35aaee7f-36c5-4d3c-a758-e75db7245332","pdf_url":null,"source":{"id":"https://openalex.org/S4306401458","display_name":"CBS Research Portal (Copenhagen Business School)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I180519160","host_organization_name":"Copenhagen Business School","host_organization_lineage":["https://openalex.org/I180519160"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Kulkarni , R, Jain, K, Bansal, H, Bangalore, S & Carl, M 2013, Mutual Disambiguation of Eye Gaze and Speech for Sight Translation and Reading. in R Bednarik , H-H Huang , K Jokinen & Y I Nakano (eds), GazeIn '13. Proceedings of the 6th Workshop on Eye Gaze in Intelligent Human Machine Interaction : Gaze in Multimodal Interaction . Association for Computing Machinery, New York, pp. 35-40, The 6th Workshop on Eye Gaze in Intelligent Human Machine Interaction. GazeIn '13, Sydney, Australia, 13/12/2013. https://doi.org/10.1145/2535948.2535953","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.800000011920929,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W171075636","https://openalex.org/W1980120944","https://openalex.org/W1982816048","https://openalex.org/W1986450680","https://openalex.org/W1991087539","https://openalex.org/W1997594216","https://openalex.org/W2008517591","https://openalex.org/W2037442428","https://openalex.org/W2044268022","https://openalex.org/W2080320702","https://openalex.org/W2083325968","https://openalex.org/W2086458350","https://openalex.org/W2090965804","https://openalex.org/W2098976116","https://openalex.org/W2137066512","https://openalex.org/W4233530569","https://openalex.org/W6680542389"],"related_works":["https://openalex.org/W2982321410","https://openalex.org/W3214178347","https://openalex.org/W2353119552","https://openalex.org/W2364379655","https://openalex.org/W2808673637","https://openalex.org/W2392004567","https://openalex.org/W2408516727","https://openalex.org/W2990201137","https://openalex.org/W2940029036","https://openalex.org/W4388292429"],"abstract_inverted_index":{"Researchers":[0],"are":[1,28],"proposing":[2],"interactive":[3],"machine":[4],"translation":[5,13,38,83,132],"as":[6,108],"a":[7,60,119],"potential":[8],"method":[9],"to":[10,31,33,110],"make":[11],"language":[12,37],"process":[14],"more":[15],"efficient":[16],"and":[17,26,50,55,71,84,88,101,126],"usable.":[18],"Introduction":[19],"of":[20,36,66,76,81,90],"different":[21],"modalities":[22,93],"like":[23],"eye":[24],"gaze":[25,139],"speech":[27,70,127],"being":[29],"explored":[30],"add":[32],"the":[34,41,64,67,74,91],"interactivity":[35],"system.":[39],"Unfortunately,":[40],"raw":[42],"data":[43],"provided":[44],"by":[45],"Automatic":[46],"Speech":[47],"Recognition":[48],"(ASR)":[49],"Eye-Tracking":[51],"is":[52],"very":[53],"noisy":[54],"erroneous.":[56],"This":[57],"paper":[58],"describes":[59],"technique":[61],"for":[62,96,99,104],"reducing":[63],"errors":[65],"two":[68,92],"modalities,":[69],"eye-gaze":[72],"with":[73],"help":[75],"each":[77],"other":[78],"in":[79,122,138,143],"context":[80],"sight":[82,131],"reading.":[85],"Lattice":[86],"representation":[87],"composition":[89],"was":[94,136],"used":[95,107],"integration.":[97],"F-measure":[98],"Eye-Gaze":[100,124],"Word":[102,128],"Accuracy":[103],"ASR":[105],"were":[106],"metrics":[109],"evaluate":[111],"our":[112],"results.":[113],"In":[114,130],"reading":[115],"task,":[116,133],"we":[117],"demonstrated":[118],"significant":[120,134],"improvement":[121,135],"both":[123],"f-measure":[125,140],"Accuracy.":[129],"found":[137],"but":[141],"not":[142],"ASR.":[144]},"counts_by_year":[{"year":2014,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
