{"id":"https://openalex.org/W7139949892","doi":"https://doi.org/10.1016/j.procs.2026.01.026","title":"AI Reading Comprehension Assistants Integrating Visual Data for Enhanced Human Understanding","display_name":"AI Reading Comprehension Assistants Integrating Visual Data for Enhanced Human Understanding","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7139949892","doi":"https://doi.org/10.1016/j.procs.2026.01.026"},"language":"en","primary_location":{"id":"doi:10.1016/j.procs.2026.01.026","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.026","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1016/j.procs.2026.01.026","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130219783","display_name":"Anupa Sinha","orcid":null},"institutions":[{"id":"https://openalex.org/I2800614057","display_name":"Kalinga University","ror":"https://ror.org/03afg5j45","country_code":"IN","type":"education","lineage":["https://openalex.org/I2800614057"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Anupa Sinha","raw_affiliation_strings":["Kalinga University, Naya Raipur, Chhattisgarh, India"],"affiliations":[{"raw_affiliation_string":"Kalinga University, Naya Raipur, Chhattisgarh, India","institution_ids":["https://openalex.org/I2800614057"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5121733784","display_name":"Roohee Khan","orcid":null},"institutions":[{"id":"https://openalex.org/I2800614057","display_name":"Kalinga University","ror":"https://ror.org/03afg5j45","country_code":"IN","type":"education","lineage":["https://openalex.org/I2800614057"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Roohee Khan","raw_affiliation_strings":["Kalinga University, Naya Raipur, Chhattisgarh, India"],"affiliations":[{"raw_affiliation_string":"Kalinga University, Naya Raipur, Chhattisgarh, India","institution_ids":["https://openalex.org/I2800614057"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5130219783"],"corresponding_institution_ids":["https://openalex.org/I2800614057"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.95238795,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":"275","issue":null,"first_page":"208","last_page":"216"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.40880000591278076,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.40880000591278076,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.023900000378489494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14394","display_name":"Cognitive Science and Education Research","score":0.021299999207258224,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reading","display_name":"Reading (process)","score":0.4991999864578247},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.4982999861240387},{"id":"https://openalex.org/keywords/reading-comprehension","display_name":"Reading comprehension","score":0.44670000672340393},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.3564000129699707},{"id":"https://openalex.org/keywords/visual-language","display_name":"Visual language","score":0.33309999108314514}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8729000091552734},{"id":"https://openalex.org/C554936623","wikidata":"https://www.wikidata.org/wiki/Q199657","display_name":"Reading (process)","level":2,"score":0.4991999864578247},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.4982999861240387},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.48809999227523804},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45649999380111694},{"id":"https://openalex.org/C2778780117","wikidata":"https://www.wikidata.org/wiki/Q3269423","display_name":"Reading comprehension","level":3,"score":0.44670000672340393},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43220001459121704},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3564000129699707},{"id":"https://openalex.org/C2780878386","wikidata":"https://www.wikidata.org/wiki/Q1659648","display_name":"Visual language","level":2,"score":0.33309999108314514},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.2831999957561493},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.2809000015258789}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.procs.2026.01.026","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.026","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.procs.2026.01.026","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2026.01.026","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.6501502394676208}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W4385067602","https://openalex.org/W4386982033","https://openalex.org/W4387059617","https://openalex.org/W4387221236","https://openalex.org/W4388494745","https://openalex.org/W4390231631","https://openalex.org/W4390506533","https://openalex.org/W4390686696","https://openalex.org/W4390974150","https://openalex.org/W4390974852","https://openalex.org/W4390974969","https://openalex.org/W4391545757","https://openalex.org/W4392234077","https://openalex.org/W4392902463","https://openalex.org/W4393618909","https://openalex.org/W4394850884","https://openalex.org/W4398198142","https://openalex.org/W4400205824","https://openalex.org/W4401453382","https://openalex.org/W4402274395","https://openalex.org/W4403446022","https://openalex.org/W4404284060","https://openalex.org/W4404300986","https://openalex.org/W4405271521","https://openalex.org/W4410382551","https://openalex.org/W4410428252","https://openalex.org/W4410616178","https://openalex.org/W4410639293","https://openalex.org/W4410949762","https://openalex.org/W4416288646"],"related_works":[],"abstract_inverted_index":{"Reading":[0],"comprehension":[1,169,224,249,277],"systems":[2,278],"are":[3,26,69],"an":[4,101],"integral":[5],"area":[6],"of":[7,45,63,142,163,174,222,230,243],"artificial":[8],"intelligence":[9],"(AI)":[10],"as":[11,51,80],"it":[12,147],"supports":[13],"human":[14,61,231,256,261],"learning":[15],"and":[16,35,48,86,123,136,166,197,226,238,260,271],"information":[17],"processing.":[18],"Compared":[19],"to":[20,29,33,128,170,195,220,235,253,273],"traditional":[21,116],"AI":[22,102,117,275],"reading":[23,103,223,236,248,276],"tools":[24,118],"which":[25,159],"only":[27,106],"able":[28],"read":[30,107],"text":[31,109,122,175],"thanks":[32],"spelling":[34],"grammar":[36],"with":[37,97,176,192],"a":[38,57,90,111,139,149],"few":[39],"language":[40,168],"specific":[41,172],"rules,":[42],"the":[43,108,121,124,133,161,177,206,247,280],"inclusion":[44],"visual":[46,67,72,98,180,199,244],"graphics":[47],"data":[49,65,245],"such":[50,79],"charts,":[52],"graphs,":[53],"diagrams":[54],"etc.":[55],"forces":[56],"cognitive":[58],"shift":[59],"towards":[60],"processing":[62],"multimodal":[64,151,213,274],"where":[66],"signals":[68,200],"important.":[70],"This":[71],"element":[73],"can":[74,126],"be":[75],"crucial":[76],"within":[77,110,246],"domains":[78],"direct":[81],"healthcare":[82],"interaction,":[83],"educational":[84],"learning,":[85],"technical":[87],"documents":[88,96,237],"in":[89,233,251,279],"workplace.":[91],"Traditional":[92],"methods":[93],"will":[94,105,183,267],"separate":[95],"components,":[99],"while":[100],"tool":[104],"document.":[112],"The":[113,208],"way":[114],"that":[115,201,216],"process":[119,250],"both":[120],"image":[125],"lead":[127],"incomplete":[129],"mental":[130],"processes":[131],"on":[132,211],"user\u2019s":[134],"behalf":[135],"this":[137,145,185],"means":[138],"diminished":[140],"level":[141],"interpretability.":[143],"In":[144],"regard,":[146],"proposes":[148],"new":[150],"framework":[152],"called":[153],"Visual-Integrated":[154],"Semantic":[155],"Textual":[156],"Assistant":[157],"(VISTA),":[158],"takes":[160],"strengths":[162],"computer":[164],"vision":[165],"natural":[167],"document":[171],"passages":[173],"most":[178],"relevant":[179],"indicators.":[181],"VISTA":[182,217,240,266],"perform":[184],"document-level":[186],"semantic":[187,190],"alignment":[188],"using":[189],"anchoring":[191],"cross-modal":[193],"attention":[194],"frame":[196],"contextualize":[198],"demonstrate":[202],"meaning":[203],"provided":[204],"by":[205],"text.":[207],"experimental":[209],"evaluations":[210],"benchmark":[212],"datasets":[214],"showed":[215],"demonstrated":[218],"improvements":[219],"aspects":[221,242],"accuracy":[225],"more":[227],"critical":[228],"aspect":[229],"interpretability":[232],"regards":[234],"indications.":[239],"integrates":[241],"order":[252],"foster":[254],"increased":[255],"engagement,":[257],"better":[258,269],"memory,":[259],"decision":[262],"making,":[263],"we":[264],"believe":[265],"provide":[268],"usefulness":[270],"applicability":[272],"future.":[281]},"counts_by_year":[],"updated_date":"2026-03-22T06:25:25.174409","created_date":"2026-03-21T00:00:00"}
