{"id":"https://openalex.org/W4411570554","doi":"https://doi.org/10.32604/cmc.2025.065421","title":"Rethinking Chart Understanding Using Multimodal Large Language Models","display_name":"Rethinking Chart Understanding Using Multimodal Large Language Models","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4411570554","doi":"https://doi.org/10.32604/cmc.2025.065421"},"language":"en","primary_location":{"id":"doi:10.32604/cmc.2025.065421","is_oa":true,"landing_page_url":"https://doi.org/10.32604/cmc.2025.065421","pdf_url":null,"source":{"id":"https://openalex.org/S4210191605","display_name":"Computers, materials & continua/Computers, materials & continua (Print)","issn_l":"1546-2218","issn":["1546-2218","1546-2226"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers, Materials &amp; Continua","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.32604/cmc.2025.065421","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Andreea-Maria Tanas\u0103","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Andreea-Maria Tanas\u0103","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5035700125","display_name":"Simona\u2010Vasilica Oprea","orcid":"https://orcid.org/0000-0002-9005-5181"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Simona-Vasilica Oprea","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.2283,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.89272342,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"84","issue":"2","first_page":"2905","last_page":"2933"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9853000044822693,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9853000044822693,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9264000058174133,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6055211424827576},{"id":"https://openalex.org/keywords/chart","display_name":"Chart","score":0.5551712512969971},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.42911091446876526},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.3656831979751587},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34711965918540955},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.1268385946750641},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09809136390686035},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.0827724039554596}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6055211424827576},{"id":"https://openalex.org/C190812933","wikidata":"https://www.wikidata.org/wiki/Q28923","display_name":"Chart","level":2,"score":0.5551712512969971},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42911091446876526},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3656831979751587},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34711965918540955},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.1268385946750641},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09809136390686035},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0827724039554596}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.32604/cmc.2025.065421","is_oa":true,"landing_page_url":"https://doi.org/10.32604/cmc.2025.065421","pdf_url":null,"source":{"id":"https://openalex.org/S4210191605","display_name":"Computers, materials & continua/Computers, materials & continua (Print)","issn_l":"1546-2218","issn":["1546-2218","1546-2226"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers, Materials &amp; Continua","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.32604/cmc.2025.065421","is_oa":true,"landing_page_url":"https://doi.org/10.32604/cmc.2025.065421","pdf_url":null,"source":{"id":"https://openalex.org/S4210191605","display_name":"Computers, materials & continua/Computers, materials & continua (Print)","issn_l":"1546-2218","issn":["1546-2218","1546-2226"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers, Materials &amp; Continua","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W3137120173","https://openalex.org/W3201302554","https://openalex.org/W4385194816","https://openalex.org/W4385990910","https://openalex.org/W4386526950","https://openalex.org/W4390619700","https://openalex.org/W4391596770","https://openalex.org/W4391876619","https://openalex.org/W4392172801","https://openalex.org/W4392947532"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Extracting":[0],"data":[1,184,323],"from":[2,104,148,268],"visually":[3],"rich":[4],"documents":[5,150,272],"and":[6,30,61,151,175,186,210,221,235,309,325],"charts":[7,262],"using":[8,91],"traditional":[9,167],"methods":[10,181],"that":[11],"rely":[12],"on":[13],"OCR-based":[14,168],"parsing":[15,97,266],"poses":[16],"multiple":[17],"challenges,":[18],"including":[19],"layout":[20],"complexity":[21],"in":[22,26,170,182,260,319],"unstructured":[23],"formats,":[24,199],"limitations":[25,165],"recognizing":[27],"visual":[28,112,171,286],"elements,":[29],"the":[31,37,70,73,102,105,119,123,155,158,164,177,204,211,224,231,236,248],"correlation":[32],"between":[33],"different":[34,254,306],"parts":[35],"of":[36,72,85,139,157,166,179,192,206,214,250,321],"documents,":[38],"as":[39,41,93,263],"well":[40],"domain-specific":[42],"semantics.":[43],"Simply":[44],"extracting":[45],"text":[46],"is":[47,115,297],"not":[48],"sufficient;":[49],"advanced":[50,302],"reasoning":[51,187,326],"capabilities":[52],"are":[53],"proving":[54],"to":[55,58,68,78,117,135,203,276,310],"be":[56],"essential":[57],"analyze":[59],"content":[60,156],"answer":[62,80,136],"questions":[63,81,140],"accurately.":[64],"This":[65,295],"paper":[66],"aims":[67],"evaluate":[69],"ability":[71],"Large":[74],"Language":[75],"Models":[76],"(LLMs)":[77],"correctly":[79],"about":[82],"various":[83],"types":[84],"charts,":[86],"comparing":[87,257],"their":[88,258,277],"performance":[89,249],"when":[90],"images":[92,103,146,264],"input":[94,198,255,307],"versus":[95,265],"directly":[96,153,267],"PDF":[98,149,269],"files.":[99],"To":[100],"retrieve":[101],"PDF,":[106],"ColPali,":[107],"a":[108,137],"model":[109],"leveraging":[110],"state-of-the-art":[111],"language":[113],"models,":[114],"used":[116,134],"identify":[118],"relevant":[120],"page":[121],"containing":[122],"appropriate":[124],"chart":[125,193,207,317],"for":[126,292],"each":[127],"question.":[128],"Google\u2019s":[129],"Gemini":[130],"multimodal":[131,180,215,251,278],"models":[132,303],"were":[133,273],"set":[138],"through":[141],"two":[142,219],"approaches:":[143],"1)":[144],"processing":[145,261],"derived":[147],"2)":[152],"utilizing":[154],"same":[159],"PDFs.":[160],"Our":[161],"findings":[162],"underscore":[163],"approaches":[169],"document":[172,216],"understanding":[173,208],"(VrDU)":[174],"demonstrate":[176],"advantages":[178],"both":[183],"extraction":[185,324],"tasks.":[188],"Through":[189],"structured":[190],"benchmarking":[191],"question":[194],"answering":[195],"(CQA)":[196],"across":[197,253],"our":[200],"work":[201],"contributes":[202],"advancement":[205],"(CU)":[209],"broader":[212],"field":[213],"analysis.":[217],"Using":[218],"diverse":[220],"information-rich":[222],"sources:":[223],"World":[225,232],"Health":[226,233],"Statistics":[227],"2024":[228,241],"report":[229],"by":[230,242],"Organisation":[234],"Global":[237],"Banking":[238],"Annual":[239],"Review":[240],"McKinsey":[243],"&":[244],"Company,":[245],"we":[246],"examine":[247],"LLMs":[252],"modalities,":[256],"effectiveness":[259],"content.":[270],"These":[271],"selected":[274],"due":[275],"nature,":[279],"combining":[280],"dense":[281],"textual":[282],"analysis":[283],"with":[284,305],"varied":[285],"representations,":[287],"thus":[288],"presenting":[289],"realistic":[290],"challenges":[291],"vision-language":[293],"models.":[294],"comparison":[296],"aimed":[298],"at":[299],"assessing":[300],"how":[301],"perform":[304],"formats":[308],"determine":[311],"if":[312],"an":[313],"image-based":[314],"approach":[315],"enhances":[316],"comprehension":[318],"terms":[320],"accurate":[322],"capabilities.":[327]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
