{"id":"https://openalex.org/W7147548920","doi":"https://doi.org/10.48550/arxiv.2603.27064","title":"ChartNet: A Million-Scale, High-Quality Multimodal Dataset for Robust Chart Understanding","display_name":"ChartNet: A Million-Scale, High-Quality Multimodal Dataset for Robust Chart Understanding","publication_year":2026,"publication_date":"2026-03-28","ids":{"openalex":"https://openalex.org/W7147548920","doi":"https://doi.org/10.48550/arxiv.2603.27064"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.27064","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27064","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.27064","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132634882","display_name":"Jovana Kondic","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kondic, Jovana","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132596434","display_name":"Pengyuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Pengyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103960169","display_name":"Dhiraj Joshi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Joshi, Dhiraj","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132617758","display_name":"Isaac Sanchez","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sanchez, Isaac","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130241064","display_name":"Ben Wiesel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wiesel, Ben","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026008142","display_name":"Shafiq Abedin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abedin, Shafiq","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012181086","display_name":"Amit Alfassy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alfassy, Amit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132567256","display_name":"Eli Schwartz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schwartz, Eli","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132693891","display_name":"Daniel Caraballo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Caraballo, Daniel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024152018","display_name":"Yagmur Gizem Cinar","orcid":"https://orcid.org/0000-0002-1884-7993"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cinar, Yagmur Gizem","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084145402","display_name":"Florian Scheidegger","orcid":"https://orcid.org/0000-0003-0430-3634"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Scheidegger, Florian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065499398","display_name":"Steven Ross","orcid":"https://orcid.org/0000-0002-2533-9946"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ross, Steven I.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043572512","display_name":"Daniel Karl I. Weidele","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Weidele, Daniel Karl I.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132628027","display_name":"Hang Hua","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hua, Hang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132670842","display_name":"Ekaterina Arutyunova","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Arutyunova, Ekaterina","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066997569","display_name":"Roei Herzig","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Herzig, Roei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069088584","display_name":"Zexue He","orcid":"https://orcid.org/0009-0001-9733-0545"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Zexue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132625338","display_name":"Zihan Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zihan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127795746","display_name":"Xinyue Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Xinyue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132597978","display_name":"Yunfei Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Yunfei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132684268","display_name":"Sicong Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Sicong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132600247","display_name":"Minghao Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Minghao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101370331","display_name":"Qunshu Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Qunshu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024778597","display_name":"Peter Staar","orcid":"https://orcid.org/0000-0002-8088-0823"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Staar, Peter","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023268703","display_name":"Luis Lastras","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lastras, Luis","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021257546","display_name":"Aude Oliva","orcid":"https://orcid.org/0000-0002-6920-914X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oliva, Aude","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132573487","display_name":"Rogerio Feris","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feris, Rogerio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":27,"corresponding_author_ids":["https://openalex.org/A5132634882"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6155999898910522,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6155999898910522,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.16910000145435333,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.03849999979138374,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/chart","display_name":"Chart","score":0.77920001745224},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.61080002784729},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.5260000228881836},{"id":"https://openalex.org/keywords/interpretation","display_name":"Interpretation (philosophy)","score":0.3743000030517578},{"id":"https://openalex.org/keywords/data-visualization","display_name":"Data visualization","score":0.3734999895095825},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.3488999903202057},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.328900009393692},{"id":"https://openalex.org/keywords/flow-chart","display_name":"Flow chart","score":0.32260000705718994}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8102999925613403},{"id":"https://openalex.org/C190812933","wikidata":"https://www.wikidata.org/wiki/Q28923","display_name":"Chart","level":2,"score":0.77920001745224},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.61080002784729},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.5260000228881836},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5069000124931335},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4902999997138977},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4108000099658966},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.3743000030517578},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.3734999895095825},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.3488999903202057},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.328900009393692},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.32739999890327454},{"id":"https://openalex.org/C2984431290","wikidata":"https://www.wikidata.org/wiki/Q185092","display_name":"Flow chart","level":2,"score":0.32260000705718994},{"id":"https://openalex.org/C196985124","wikidata":"https://www.wikidata.org/wiki/Q1369242","display_name":"Control chart","level":3,"score":0.2971000075340271},{"id":"https://openalex.org/C138958017","wikidata":"https://www.wikidata.org/wiki/Q190087","display_name":"Data type","level":2,"score":0.2946999967098236},{"id":"https://openalex.org/C205208641","wikidata":"https://www.wikidata.org/wiki/Q273404","display_name":"Pie chart","level":2,"score":0.29170000553131104},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2842000126838684},{"id":"https://openalex.org/C2780878386","wikidata":"https://www.wikidata.org/wiki/Q1659648","display_name":"Visual language","level":2,"score":0.28200000524520874},{"id":"https://openalex.org/C2780977526","wikidata":"https://www.wikidata.org/wiki/Q42417149","display_name":"Data exploration","level":3,"score":0.2775000035762787},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.27000001072883606},{"id":"https://openalex.org/C27209215","wikidata":"https://www.wikidata.org/wiki/Q1192777","display_name":"Radar chart","level":2,"score":0.2637999951839447},{"id":"https://openalex.org/C56288433","wikidata":"https://www.wikidata.org/wiki/Q58673","display_name":"Data manipulation language","level":2,"score":0.25769999623298645},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2556999921798706}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.27064","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27064","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.27064","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.27064","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Understanding":[0],"charts":[1],"requires":[2],"models":[3,23,159],"to":[4,36,49,153],"jointly":[5],"reason":[6],"over":[7],"geometric":[8],"visual":[9,117],"patterns,":[10],"structured":[11],"numerical":[12],"data,":[13,105,107],"and":[14,40,60,81,109,121,162],"natural":[15,78],"language":[16,79],"--":[17],"a":[18,30,44,112],"capability":[19],"where":[20],"current":[21],"vision-language":[22],"(VLMs)":[24],"remain":[25],"limited.":[26],"We":[27],"introduce":[28],"ChartNet,":[29],"high-quality,":[31],"million-scale":[32],"multimodal":[33,141],"dataset":[34,147,170],"designed":[35],"advance":[37],"chart":[38,54,58,74,95,124],"interpretation":[39],"reasoning.":[41],"ChartNet":[42,97,128,151],"leverages":[43],"novel":[45],"code-guided":[46],"synthesis":[47],"pipeline":[48,115],"generate":[50],"1.5":[51],"million":[52],"diverse":[53],"samples":[55],"spanning":[56],"24":[57],"types":[59],"6":[61],"plotting":[62,71],"libraries.":[63],"Each":[64],"sample":[65],"consists":[66],"of":[67,94,148,157],"five":[68],"aligned":[69],"components:":[70],"code,":[72],"rendered":[73],"image,":[75],"data":[76,166],"table,":[77],"summary,":[80],"question-answering":[82],"with":[83,160],"reasoning,":[84],"providing":[85],"fine-grained":[86],"cross-modal":[87],"alignment.":[88],"To":[89],"capture":[90],"the":[91,144,155],"full":[92],"spectrum":[93],"comprehension,":[96],"additionally":[98],"includes":[99],"specialized":[100],"subsets":[101],"encompassing":[102],"human":[103],"annotated":[104],"real-world":[106],"safety,":[108],"grounding.":[110],"Moreover,":[111],"rigorous":[113],"quality-filtering":[114],"ensures":[116],"fidelity,":[118],"semantic":[119],"accuracy,":[120],"diversity":[122],"across":[123,132],"representations.":[125],"Fine-tuning":[126],"on":[127],"consistently":[129],"improves":[130],"results":[131],"benchmarks,":[133],"demonstrating":[134],"its":[135,149],"utility":[136],"as":[137],"large-scale":[138],"supervision":[139],"for":[140,165],"models.":[142],"As":[143],"largest":[145],"open-source":[146],"kind,":[150],"aims":[152],"support":[154],"development":[156],"foundation":[158],"robust":[161],"generalizable":[163],"capabilities":[164],"visualization":[167],"understanding.":[168],"The":[169],"is":[171],"publicly":[172],"available":[173],"at":[174],"https://huggingface.co/datasets/ibm-granite/ChartNet":[175]},"counts_by_year":[],"updated_date":"2026-05-04T08:30:34.212998","created_date":"2026-04-02T00:00:00"}
