{"id":"https://openalex.org/W7134804671","doi":"https://doi.org/10.48550/arxiv.2603.08704","title":"Evaluating Financial Intelligence in Large Language Models: Benchmarking SuperInvesting AI with LLM Engines","display_name":"Evaluating Financial Intelligence in Large Language Models: Benchmarking SuperInvesting AI with LLM Engines","publication_year":2026,"publication_date":"2026-03-09","ids":{"openalex":"https://openalex.org/W7134804671","doi":"https://doi.org/10.48550/arxiv.2603.08704"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.08704","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128638392","display_name":"Akshay Gulati","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gulati, Akshay","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128681676","display_name":"Kanha Singhania","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Singhania, Kanha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128665012","display_name":"Tushar Banga","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Banga, Tushar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128641463","display_name":"Parth Arora","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Arora, Parth","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128668630","display_name":"Anshul Verma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Verma, Anshul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128682592","display_name":"Vaibhav Kumar Singh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Singh, Vaibhav Kumar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128638732","display_name":"Agyapal Digra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Digra, Agyapal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128678265","display_name":"Jayant Singh Bisht","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bisht, Jayant Singh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086589807","display_name":"Danish Sharma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharma, Danish","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128676665","display_name":"Varun Singla","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Singla, Varun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5121392987","display_name":"Shubh Garg","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Garg, Shubh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.7211999893188477,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11326","display_name":"Stock Market Forecasting Methods","score":0.7211999893188477,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.05660000070929527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.01889999955892563,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/perplexity","display_name":"Perplexity","score":0.6848000288009644},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.6165000200271606},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.44850000739097595},{"id":"https://openalex.org/keywords/equity","display_name":"Equity (law)","score":0.41830000281333923},{"id":"https://openalex.org/keywords/financial-modeling","display_name":"Financial modeling","score":0.37459999322891235},{"id":"https://openalex.org/keywords/data-collection","display_name":"Data collection","score":0.3617999851703644},{"id":"https://openalex.org/keywords/f1-score","display_name":"F1 score","score":0.35010001063346863},{"id":"https://openalex.org/keywords/aggregate","display_name":"Aggregate (composite)","score":0.3472000062465668}],"concepts":[{"id":"https://openalex.org/C100279451","wikidata":"https://www.wikidata.org/wiki/Q372193","display_name":"Perplexity","level":3,"score":0.6848000288009644},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.6165000200271606},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5976999998092651},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.44850000739097595},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4359999895095825},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.4251999855041504},{"id":"https://openalex.org/C199728807","wikidata":"https://www.wikidata.org/wiki/Q2578557","display_name":"Equity (law)","level":2,"score":0.41830000281333923},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40950000286102295},{"id":"https://openalex.org/C23925645","wikidata":"https://www.wikidata.org/wiki/Q5449731","display_name":"Financial modeling","level":2,"score":0.37459999322891235},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.3617999851703644},{"id":"https://openalex.org/C148524875","wikidata":"https://www.wikidata.org/wiki/Q6975395","display_name":"F1 score","level":2,"score":0.35010001063346863},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.3472000062465668},{"id":"https://openalex.org/C27548731","wikidata":"https://www.wikidata.org/wiki/Q88272","display_name":"Investment (military)","level":3,"score":0.3409000039100647},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3336000144481659},{"id":"https://openalex.org/C2778058735","wikidata":"https://www.wikidata.org/wiki/Q4692253","display_name":"Aggregate data","level":2,"score":0.3260999917984009},{"id":"https://openalex.org/C98014903","wikidata":"https://www.wikidata.org/wiki/Q832161","display_name":"Financial ratio","level":2,"score":0.3230000138282776},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.31690001487731934},{"id":"https://openalex.org/C130731218","wikidata":"https://www.wikidata.org/wiki/Q1363554","display_name":"Financial analysis","level":2,"score":0.2919999957084656},{"id":"https://openalex.org/C17231256","wikidata":"https://www.wikidata.org/wiki/Q5156540","display_name":"Completeness (order theory)","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C70179600","wikidata":"https://www.wikidata.org/wiki/Q1416547","display_name":"Financial plan","level":2,"score":0.259799987077713},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25839999318122864},{"id":"https://openalex.org/C193221554","wikidata":"https://www.wikidata.org/wiki/Q5153664","display_name":"Commonsense reasoning","level":2,"score":0.2549000084400177}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.08704","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.08704","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08704","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.08704","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1,159],"models":[2,160],"are":[3],"increasingly":[4],"used":[5],"for":[6,181],"financial":[7,17,40,74,155,169],"analysis":[8,41,75],"and":[9,54,66,110,148,164],"investment":[10,183],"research,":[11],"yet":[12],"systematic":[13],"evaluation":[14,35],"of":[15,71,108,115],"their":[16],"reasoning":[18,174],"capabilities":[19,42,175],"remains":[20],"limited.":[21],"In":[22],"this":[23,93],"work,":[24],"we":[25],"introduce":[26],"the":[27,98,111,120,151,177],"AI":[28,60],"Financial":[29],"Intelligence":[30],"Benchmark":[31],"(AFIB),":[32],"a":[33,69],"multi-dimensional":[34],"framework":[36],"designed":[37],"to":[38,139],"assess":[39],"across":[43,90],"five":[44,59],"dimensions:":[45],"factual":[46,105],"accuracy,":[47],"analytical":[48,146,173],"completeness,":[49],"data":[50,135,170],"recency,":[51],"model":[52],"consistency,":[53],"failure":[55],"patterns.":[56],"We":[57],"evaluate":[58],"systems:":[61],"GPT,":[62],"Gemini,":[63],"Perplexity,":[64],"Claude,":[65],"SuperInvesting,":[67],"using":[68],"dataset":[70],"95+":[72],"structured":[73,168],"questions":[76],"derived":[77],"from":[78],"real-world":[79],"equity":[80],"research":[81,184],"tasks.":[82],"The":[83],"results":[84,152],"reveal":[85],"substantial":[86],"differences":[87],"in":[88,157],"performance":[89,180],"models.":[91],"Within":[92],"benchmark":[94],"setting,":[95],"SuperInvesting":[96],"achieves":[97],"highest":[99,112],"aggregate":[100],"performance,":[101],"with":[102,172],"an":[103],"average":[104],"accuracy":[106],"score":[107,114],"8.96/10":[109],"completeness":[113],"56.65/70,":[116],"while":[117],"also":[118],"demonstrating":[119],"lowest":[121],"hallucination":[122],"rate":[123],"among":[124],"evaluated":[125],"systems.":[126],"Retrieval-oriented":[127],"systems":[128,165],"such":[129],"as":[130],"Perplexity":[131],"perform":[132],"strongly":[133],"on":[134],"recency":[136],"tasks":[137],"due":[138],"live":[140],"information":[141],"access":[142,171],"but":[143],"exhibit":[144],"weaker":[145],"synthesis":[147],"consistency.":[149],"Overall,":[150],"highlight":[153],"that":[154,166],"intelligence":[156],"large":[158],"is":[161],"inherently":[162],"multi-dimensional,":[163],"combine":[167],"provide":[176],"most":[178],"reliable":[179],"complex":[182],"workflows.":[185]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-11T00:00:00"}
