{"id":"https://openalex.org/W4409736063","doi":"https://doi.org/10.1145/3706598.3714210","title":"Beyond Visual Perception: Insights from Smartphone Interaction of Visually Impaired Users with Large Multimodal Models","display_name":"Beyond Visual Perception: Insights from Smartphone Interaction of Visually Impaired Users with Large Multimodal Models","publication_year":2025,"publication_date":"2025-04-24","ids":{"openalex":"https://openalex.org/W4409736063","doi":"https://doi.org/10.1145/3706598.3714210","pmid":"https://pubmed.ncbi.nlm.nih.gov/40792292"},"language":"en","primary_location":{"id":"doi:10.1145/3706598.3714210","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3706598.3714210","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC12338113/pdf/nihms-2046489.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045705100","display_name":"Jingyi Xie","orcid":"https://orcid.org/0000-0002-2753-2360"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jingyi Xie","raw_affiliation_strings":["College of Information Sciences and Technology, Pennsylvania State University, University Park, Pennsylvania, USA"],"raw_orcid":"https://orcid.org/0000-0002-2753-2360","affiliations":[{"raw_affiliation_string":"College of Information Sciences and Technology, Pennsylvania State University, University Park, Pennsylvania, USA","institution_ids":["https://openalex.org/I130769515"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082660075","display_name":"Rui Yu","orcid":"https://orcid.org/0000-0002-0946-6769"},"institutions":[{"id":"https://openalex.org/I142740786","display_name":"University of Louisville","ror":"https://ror.org/01ckdn478","country_code":"US","type":"education","lineage":["https://openalex.org/I142740786"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rui Yu","raw_affiliation_strings":["Department of Computer Science and Engineering, University of Louisville, Louisville, Kentucky, USA"],"raw_orcid":"https://orcid.org/0000-0002-0946-6769","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, University of Louisville, Louisville, Kentucky, USA","institution_ids":["https://openalex.org/I142740786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071350138","display_name":"H. Zhang","orcid":"https://orcid.org/0000-0002-8169-1653"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"He Zhang","raw_affiliation_strings":["College of Information Sciences and Technology, Pennsylvania State University, State College, Pennsylvania, USA"],"raw_orcid":"https://orcid.org/0000-0002-8169-1653","affiliations":[{"raw_affiliation_string":"College of Information Sciences and Technology, Pennsylvania State University, State College, Pennsylvania, USA","institution_ids":["https://openalex.org/I130769515"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005834738","display_name":"Syed Masum Billah","orcid":"https://orcid.org/0000-0001-5063-3808"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Syed Masum Billah","raw_affiliation_strings":["College of Information Sciences and Technology, Pennsylvania State University, University Park, Pennsylvania, USA"],"raw_orcid":"https://orcid.org/0000-0001-5063-3808","affiliations":[{"raw_affiliation_string":"College of Information Sciences and Technology, Pennsylvania State University, University Park, Pennsylvania, USA","institution_ids":["https://openalex.org/I130769515"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100626494","display_name":"Sooyeon Lee","orcid":"https://orcid.org/0000-0002-4971-2004"},"institutions":[{"id":"https://openalex.org/I118118575","display_name":"New Jersey Institute of Technology","ror":"https://ror.org/05e74xb87","country_code":"US","type":"education","lineage":["https://openalex.org/I118118575"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sooyeon Lee","raw_affiliation_strings":["Ying Wu College of Computing, New Jersey Institute of Technology, Newark, New Jersey, USA"],"raw_orcid":"https://orcid.org/0000-0002-4971-2004","affiliations":[{"raw_affiliation_string":"Ying Wu College of Computing, New Jersey Institute of Technology, Newark, New Jersey, USA","institution_ids":["https://openalex.org/I118118575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054610664","display_name":"John M. Carroll","orcid":"https://orcid.org/0000-0001-5189-337X"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"John M. Carroll","raw_affiliation_strings":["College of Information Sciences and Technology, Pennsylvania State University, University Park, Pennsylvania, USA"],"raw_orcid":"https://orcid.org/0000-0001-5189-337X","affiliations":[{"raw_affiliation_string":"College of Information Sciences and Technology, Pennsylvania State University, University Park, Pennsylvania, USA","institution_ids":["https://openalex.org/I130769515"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5045705100"],"corresponding_institution_ids":["https://openalex.org/I130769515"],"apc_list":null,"apc_paid":null,"fwci":13.9499,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.99118827,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"25","issue":null,"first_page":"1","last_page":"17"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10914","display_name":"Tactile and Sensory Interactions","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10914","display_name":"Tactile and Sensory Interactions","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10789","display_name":"Interactive and Immersive Displays","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/visually-impaired","display_name":"Visually impaired","score":0.7883316874504089},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.6979107856750488},{"id":"https://openalex.org/keywords/multimodal-interaction","display_name":"Multimodal interaction","score":0.6938725709915161},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6834287643432617},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.6438407301902771},{"id":"https://openalex.org/keywords/visual-impairment","display_name":"Visual impairment","score":0.47453033924102783},{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.45415085554122925},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.34643852710723877},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.33708250522613525},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32291537523269653},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.1770685613155365},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.12564969062805176}],"concepts":[{"id":"https://openalex.org/C3020106864","wikidata":"https://www.wikidata.org/wiki/Q737460","display_name":"Visually impaired","level":2,"score":0.7883316874504089},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.6979107856750488},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.6938725709915161},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6834287643432617},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.6438407301902771},{"id":"https://openalex.org/C2781372952","wikidata":"https://www.wikidata.org/wiki/Q737460","display_name":"Visual impairment","level":2,"score":0.47453033924102783},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.45415085554122925},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.34643852710723877},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.33708250522613525},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32291537523269653},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.1770685613155365},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.12564969062805176},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C118552586","wikidata":"https://www.wikidata.org/wiki/Q7867","display_name":"Psychiatry","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3706598.3714210","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3706598.3714210","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"},{"id":"pmid:40792292","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40792292","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SIGCHI conference on human factors in computing systems. CHI Conference","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:12338113","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/12338113","pdf_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC12338113/pdf/nihms-2046489.pdf","source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Proc SIGCHI Conf Hum Factor Comput Syst","raw_type":"Text"}],"best_oa_location":{"id":"pmh:oai:pubmedcentral.nih.gov:12338113","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/12338113","pdf_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC12338113/pdf/nihms-2046489.pdf","source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Proc SIGCHI Conf Hum Factor Comput Syst","raw_type":"Text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7804810424","display_name":null,"funder_award_id":"R01 LM013330","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"}],"funders":[{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4409736063.pdf"},"referenced_works_count":53,"referenced_works":["https://openalex.org/W1535763807","https://openalex.org/W1979290264","https://openalex.org/W2004599511","https://openalex.org/W2012339105","https://openalex.org/W2090048052","https://openalex.org/W2095781211","https://openalex.org/W2096031678","https://openalex.org/W2116680608","https://openalex.org/W2124226560","https://openalex.org/W2127428155","https://openalex.org/W2138847321","https://openalex.org/W2140217131","https://openalex.org/W2557827106","https://openalex.org/W2790378580","https://openalex.org/W2963622213","https://openalex.org/W2990138404","https://openalex.org/W2990751682","https://openalex.org/W2998746484","https://openalex.org/W3029394045","https://openalex.org/W3030405946","https://openalex.org/W3030476761","https://openalex.org/W3034700241","https://openalex.org/W3041212832","https://openalex.org/W3106877404","https://openalex.org/W3110019360","https://openalex.org/W3162205072","https://openalex.org/W3164652469","https://openalex.org/W3168398407","https://openalex.org/W3175373394","https://openalex.org/W3185101217","https://openalex.org/W3207136799","https://openalex.org/W4220779313","https://openalex.org/W4220878552","https://openalex.org/W4224936685","https://openalex.org/W4255697435","https://openalex.org/W4281833181","https://openalex.org/W4292260217","https://openalex.org/W4307136615","https://openalex.org/W4383682878","https://openalex.org/W4385894687","https://openalex.org/W4387793598","https://openalex.org/W4393147158","https://openalex.org/W4393969035","https://openalex.org/W4396832221","https://openalex.org/W4396833521","https://openalex.org/W4396833689","https://openalex.org/W4398165080","https://openalex.org/W4399488123","https://openalex.org/W4400648371","https://openalex.org/W4400768356","https://openalex.org/W4403576862","https://openalex.org/W4405862095","https://openalex.org/W4409735071"],"related_works":["https://openalex.org/W2166248296","https://openalex.org/W2995743050","https://openalex.org/W2968820833","https://openalex.org/W2976816735","https://openalex.org/W3022313497","https://openalex.org/W332756932","https://openalex.org/W2068964259","https://openalex.org/W2013013717","https://openalex.org/W66256988","https://openalex.org/W4302857920"],"abstract_inverted_index":{"Large":[0],"multimodal":[1],"models":[2],"(LMMs)":[3],"have":[4],"enabled":[5],"new":[6],"AI-powered":[7],"applications":[8],"that":[9],"help":[10],"people":[11],"with":[12,74],"visual":[13,33],"impairments":[14],"(PVI)":[15],"receive":[16],"natural":[17],"language":[18],"descriptions":[19,83],"of":[20,32,56,81,112,151],"their":[21,41,69,120],"surroundings":[22],"through":[23],"audible":[24],"text.":[25],"We":[26],"investigated":[27],"how":[28,36],"this":[29],"emerging":[30],"paradigm":[31],"assistance":[34],"transforms":[35],"PVI":[37],"perform":[38],"and":[39,54,61,79,87,110,116,127,144,155],"manage":[40],"daily":[42],"tasks.":[43],"Moving":[44],"beyond":[45],"basic":[46],"usability":[47],"assessments,":[48],"we":[49,97,136],"examined":[50],"both":[51,85,142],"the":[52,149],"capabilities":[53,122],"limitations":[55],"LMM-based":[57,95],"tools":[58],"in":[59],"personal":[60],"social":[62,88,113],"contexts,":[63,114],"while":[64],"exploring":[65],"design":[66,138],"implications":[67],"for":[68,140],"future":[70],"development.":[71],"Through":[72],"interviews":[73],"14":[75],"visually":[76],"impaired":[77],"users":[78],"analysis":[80],"image":[82],"from":[84,108],"participants":[86],"media":[89],"using":[90],"Be":[91],"My":[92],"AI":[93],"(an":[94],"application),":[96],"identified":[98],"two":[99],"key":[100],"limitations.":[101],"First,":[102],"these":[103,134],"systems'":[104],"context":[105],"awareness":[106],"suffers":[107],"hallucinations":[109],"misinterpretations":[111],"styles,":[115],"human":[117],"identities.":[118],"Second,":[119],"intent-oriented":[121],"often":[123],"fail":[124],"to":[125,148],"grasp":[126],"act":[128],"on":[129,133],"users'":[130],"intentions.":[131],"Based":[132],"findings,":[135],"propose":[137],"strategies":[139],"improving":[141],"human-AI":[143],"AI-AI":[145],"interactions,":[146],"contributing":[147],"development":[150],"more":[152],"effective,":[153],"interactive,":[154],"personalized":[156],"assistive":[157],"technologies.":[158]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":5}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
