{"id":"https://openalex.org/W4403995758","doi":"https://doi.org/10.48550/arxiv.2410.14331","title":"ChartifyText: Automated Chart Generation from Data-Involved Texts via LLM","display_name":"ChartifyText: Automated Chart Generation from Data-Involved Texts via LLM","publication_year":2024,"publication_date":"2024-10-18","ids":{"openalex":"https://openalex.org/W4403995758","doi":"https://doi.org/10.48550/arxiv.2410.14331"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2410.14331","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.14331","pdf_url":"https://arxiv.org/pdf/2410.14331","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2410.14331","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040591596","display_name":"Songheng Zhang","orcid":"https://orcid.org/0000-0002-0191-220X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Songheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107094040","display_name":"Lei Wang","orcid":"https://orcid.org/0000-0001-8085-2374"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Lei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007240808","display_name":"Toby Jia-Jun Li","orcid":"https://orcid.org/0000-0001-7902-7625"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Toby Jia-Jun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039231102","display_name":"Qiaomu Shen","orcid":"https://orcid.org/0000-0002-6510-0964"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Qiaomu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101488072","display_name":"Yixin Cao","orcid":"https://orcid.org/0000-0002-1632-7812"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Yixin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5045655558","display_name":"Yong Wang","orcid":"https://orcid.org/0000-0003-3489-7672"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yong","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5040591596"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.9846000075340271,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12377","display_name":"Digital Humanities and Scholarship","score":0.9491000175476074,"subfield":{"id":"https://openalex.org/subfields/1208","display_name":"Literature and Literary Theory"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/chart","display_name":"Chart","score":0.6237037181854248},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6037858128547668},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.41837966442108154},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3691549301147461},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3335462808609009},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.13140857219696045},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09682238101959229}],"concepts":[{"id":"https://openalex.org/C190812933","wikidata":"https://www.wikidata.org/wiki/Q28923","display_name":"Chart","level":2,"score":0.6237037181854248},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6037858128547668},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41837966442108154},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3691549301147461},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3335462808609009},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.13140857219696045},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09682238101959229}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2410.14331","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.14331","pdf_url":"https://arxiv.org/pdf/2410.14331","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2410.14331","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2410.14331","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2410.14331","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.14331","pdf_url":"https://arxiv.org/pdf/2410.14331","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4403995758.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Text":[0],"documents":[1,186],"with":[2,160,192,201],"numerical":[3],"values":[4,144],"involved":[5],"are":[6,149],"widely":[7],"used":[8],"in":[9,77,213],"various":[10],"applications":[11],"such":[12,30],"as":[13],"scientific":[14],"research,":[15],"economy,":[16],"public":[17],"health":[18],"and":[19,33,55,73,80,115,145,164,173,196,209,217],"journalism.":[20],"However,":[21],"it":[22],"is":[23,60],"difficult":[24],"for":[25],"readers":[26,215],"to":[27,45,49,57,98,103,128,134,167],"quickly":[28],"interpret":[29],"data-involved":[31,101,184,222],"texts":[32,102,166],"gain":[34],"deep":[35],"insights.":[36,174],"To":[37],"fill":[38],"this":[39,42],"research":[40],"gap,":[41],"work":[43],"aims":[44],"automatically":[46],"generate":[47],"charts":[48,159],"accurately":[50,168],"convey":[51,169],"the":[52,130,170,178,207],"underlying":[53,171],"data":[54,76,113,121,139,143,172],"ideas":[56],"readers,":[58],"which":[59],"essentially":[61],"a":[62,88,197],"challenging":[63],"task.":[64],"The":[65,119,152,204],"challenges":[66],"originate":[67],"from":[68],"text":[69,78,185],"ambiguities,":[70],"intrinsic":[71],"sparsity":[72],"uncertainty":[74],"of":[75,108,180,211,221],"documents,":[79],"subjective":[81,147],"sentiment":[82],"differences.":[83],"Specifically,":[84],"we":[85],"propose":[86],"ChartifyText,":[87],"novel":[89],"fully-automated":[90],"approach":[91],"that":[92],"leverages":[93],"Large":[94],"Language":[95],"Models":[96],"(LLMs)":[97],"convert":[99],"complex":[100],"expressive":[104,116,153],"charts.":[105],"It":[106],"consists":[107],"two":[109],"major":[110],"modules:":[111],"tabular":[112,120],"inference":[114,122],"chart":[117,154],"generation.":[118],"module":[123,156],"employs":[124],"systematic":[125],"prompt":[126],"engineering":[127],"guide":[129],"LLM":[131],"(e.g.,":[132],"GPT-4)":[133],"infer":[135],"table":[136],"data,":[137],"where":[138],"ranges,":[140],"uncertainties,":[141],"missing":[142],"corresponding":[146],"sentiments":[148],"explicitly":[150],"considered.":[151],"generation":[155],"augments":[157],"standard":[158],"intuitive":[161],"visual":[162],"encodings":[163],"concise":[165],"We":[175],"extensively":[176],"evaluate":[177],"effectiveness":[179,210],"ChartifyText":[181,212],"on":[182],"real-world":[183],"through":[187],"case":[188],"studies,":[189],"in-depth":[190],"interviews":[191],"three":[193],"visualization":[194],"experts,":[195],"carefully-designed":[198],"user":[199],"study":[200],"15":[202],"participants.":[203],"results":[205],"demonstrate":[206],"usefulness":[208],"helping":[214],"efficiently":[216],"effectively":[218],"make":[219],"sense":[220],"texts.":[223]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
