{"id":"https://openalex.org/W7163026506","doi":"https://doi.org/10.48550/arxiv.2605.31064","title":"Fighting Numerical Hallucinations via Data-centric Compilation for Online Financial QA","display_name":"Fighting Numerical Hallucinations via Data-centric Compilation for Online Financial QA","publication_year":2026,"publication_date":"2026-05-29","ids":{"openalex":"https://openalex.org/W7163026506","doi":"https://doi.org/10.48550/arxiv.2605.31064"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.31064","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31064","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.31064","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137556795","display_name":"Hao Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137531874","display_name":"Xing Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Xing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016923469","display_name":"Qirui Liu","orcid":"https://orcid.org/0009-0008-8385-2490"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Qirui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137606684","display_name":"Weijie Shi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Weijie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137573519","display_name":"Shiwei Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Shiwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137571759","display_name":"Fuyuan Lyu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lyu, Fuyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137558081","display_name":"Weihong Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Weihong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137569121","display_name":"Xiku Du","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Xiku","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5083350101","display_name":"Xiuqiang He","orcid":"https://orcid.org/0000-0002-4115-8205"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Xiuqiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3828999996185303,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3828999996185303,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.09939999878406525,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.04540000110864639,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/audit","display_name":"Audit","score":0.6891999840736389},{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.6579999923706055},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5241000056266785},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.5088000297546387},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.49390000104904175},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.48890000581741333},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4830999970436096},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.4575999975204468},{"id":"https://openalex.org/keywords/structuring","display_name":"Structuring","score":0.4526999890804291}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7211999893188477},{"id":"https://openalex.org/C199521495","wikidata":"https://www.wikidata.org/wiki/Q181487","display_name":"Audit","level":2,"score":0.6891999840736389},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.6579999923706055},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5241000056266785},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.5088000297546387},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.49390000104904175},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.48890000581741333},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4830999970436096},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.4575999975204468},{"id":"https://openalex.org/C2775945657","wikidata":"https://www.wikidata.org/wiki/Q381442","display_name":"Structuring","level":2,"score":0.4526999890804291},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.450300008058548},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42579999566078186},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3978999853134155},{"id":"https://openalex.org/C2780992000","wikidata":"https://www.wikidata.org/wiki/Q17016113","display_name":"Generator (circuit theory)","level":3,"score":0.3869999945163727},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.376800000667572},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.37310001254081726},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.3718000054359436},{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.366100013256073},{"id":"https://openalex.org/C193221554","wikidata":"https://www.wikidata.org/wiki/Q5153664","display_name":"Commonsense reasoning","level":2,"score":0.35850000381469727},{"id":"https://openalex.org/C202695956","wikidata":"https://www.wikidata.org/wiki/Q2669680","display_name":"Debriefing","level":2,"score":0.3546000123023987},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3425999879837036},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.3384999930858612},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.31299999356269836},{"id":"https://openalex.org/C2779458634","wikidata":"https://www.wikidata.org/wiki/Q24963715","display_name":"Debiasing","level":2,"score":0.3100000023841858},{"id":"https://openalex.org/C42525527","wikidata":"https://www.wikidata.org/wiki/Q1209955","display_name":"Formative assessment","level":2,"score":0.2913999855518341},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.28060001134872437},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2800999879837036},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.27790001034736633},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.2777000069618225},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2770000100135803},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.2766000032424927},{"id":"https://openalex.org/C102944935","wikidata":"https://www.wikidata.org/wiki/Q4953701","display_name":"Bracketing (phenomenology)","level":2,"score":0.27639999985694885},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.27230000495910645},{"id":"https://openalex.org/C105002631","wikidata":"https://www.wikidata.org/wiki/Q4833645","display_name":"Subject-matter expert","level":3,"score":0.271699994802475},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.2621999979019165}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.31064","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31064","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.31064","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31064","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"have":[4],"significantly":[5],"advanced":[6],"online":[7,192],"data":[8,115],"services,":[9],"particularly":[10],"in":[11,32,47,76,84,189],"the":[12,72,101,152],"domain":[13],"of":[14,138],"financial":[15,34,193],"question":[16],"answering":[17],"(FinQA).":[18],"However,":[19],"such":[20],"systems":[21],"remain":[22],"susceptible":[23],"to":[24,44,80,124],"numerical":[25,170],"reasoning":[26,163,171],"hallucinations,":[27],"which":[28,66,117],"critically":[29],"undermine":[30],"reliability":[31],"high-stakes":[33],"applications.":[35],"Although":[36],"retrieval-augmented":[37],"generation":[38],"(RAG)":[39],"has":[40],"been":[41],"widely":[42],"adopted":[43],"ground":[45],"responses":[46],"external":[48],"knowledge,":[49],"it":[50],"introduces":[51],"three":[52,110],"persistent":[53],"challenges:":[54],"noise":[55,123],"sensitivity,":[56],"calculation":[57],"fragility,":[58],"and":[59,96,142,145,157,182],"an":[60,85],"auditability":[61],"crisis.":[62],"Existing":[63],"model-centric":[64],"approaches,":[65],"primarily":[67],"focus":[68],"on":[69,178],"optimizing":[70],"either":[71],"retriever":[73],"or":[74],"generator":[75],"isolation,":[77],"still":[78],"struggle":[79],"address":[81],"these":[82],"issues":[83],"integrated":[86],"manner.":[87],"In":[88],"this":[89],"work,":[90],"we":[91],"pioneer":[92],"a":[93,98,132,147,190],"data-centric":[94],"paradigm":[95],"propose":[97],"novel":[99],"framework,":[100],"Data-centric":[102,133],"Reasoning":[103],"Compiler":[104],"(DCRC).":[105],"The":[106],"framework":[107,167,186],"operates":[108],"through":[109,187],"cohesive":[111],"phases:":[112],"(1)":[113],"adversarial":[114],"construction,":[116],"synthesizes":[118],"training":[119,129],"examples":[120],"with":[121],"controlled":[122],"teach":[125],"robustness;":[126],"(2)":[127],"multi-stage":[128],"that":[130],"cultivates":[131],"Structuring":[134],"Agent":[135],"(DSA)":[136],"capable":[137],"explicit":[139],"evidence":[140],"auditing":[141],"program":[143],"synthesis;":[144],"(3)":[146],"compile-and-execute":[148],"inference":[149],"process,":[150],"where":[151],"DSA":[153],"transforms":[154],"user":[155],"queries":[156],"retrieved":[158],"documents":[159],"into":[160],"verifiable,":[161],"executable":[162],"programs.":[164],"This":[165],"data-driven":[166],"ensures":[168],"faithful":[169],"by":[172],"design.":[173],"We":[174],"conduct":[175],"extensive":[176],"experiments":[177],"established":[179],"offline":[180],"benchmarks":[181],"further":[183],"validate":[184],"our":[185],"deployment":[188],"real-world":[191],"QA":[194],"system.":[195]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-06-02T00:00:00"}
