{"id":"https://openalex.org/W7131824587","doi":"https://doi.org/10.48550/arxiv.2602.23286","title":"SPARTA: Scalable and Principled Benchmark of Tree-Structured Multi-hop QA over Text and Tables","display_name":"SPARTA: Scalable and Principled Benchmark of Tree-Structured Multi-hop QA over Text and Tables","publication_year":2026,"publication_date":"2026-02-26","ids":{"openalex":"https://openalex.org/W7131824587","doi":"https://doi.org/10.48550/arxiv.2602.23286"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.23286","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121301448","display_name":"Sungho Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Park, Sungho","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127265839","display_name":"Jueun Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Jueun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5127199787","display_name":"Wook-Shin Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Wook-Shin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5121301448"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.22789999842643738,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.22789999842643738,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1517000049352646,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.09529999643564224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6100000143051147},{"id":"https://openalex.org/keywords/sql","display_name":"SQL","score":0.5534999966621399},{"id":"https://openalex.org/keywords/tuple","display_name":"Tuple","score":0.5138999819755554},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5101000070571899},{"id":"https://openalex.org/keywords/oracle","display_name":"Oracle","score":0.49729999899864197},{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.45649999380111694},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.4523000121116638},{"id":"https://openalex.org/keywords/row","display_name":"Row","score":0.4072999954223633},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4004000127315521}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8385000228881836},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6100000143051147},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.5534999966621399},{"id":"https://openalex.org/C118930307","wikidata":"https://www.wikidata.org/wiki/Q600590","display_name":"Tuple","level":2,"score":0.5138999819755554},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5101000070571899},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.49729999899864197},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4652000069618225},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4627000093460083},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.45649999380111694},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.4523000121116638},{"id":"https://openalex.org/C135598885","wikidata":"https://www.wikidata.org/wiki/Q1366302","display_name":"Row","level":2,"score":0.4072999954223633},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4004000127315521},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.39969998598098755},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.3813999891281128},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36059999465942383},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.35899999737739563},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.35420000553131104},{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.34630000591278076},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.33070001006126404},{"id":"https://openalex.org/C2777026412","wikidata":"https://www.wikidata.org/wiki/Q2684591","display_name":"Statement (logic)","level":2,"score":0.32839998602867126},{"id":"https://openalex.org/C192028432","wikidata":"https://www.wikidata.org/wiki/Q845739","display_name":"Query language","level":2,"score":0.3273000121116638},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3215999901294708},{"id":"https://openalex.org/C67388219","wikidata":"https://www.wikidata.org/wiki/Q207440","display_name":"Hash table","level":3,"score":0.3190999925136566},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.2897000014781952},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.28769999742507935},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.28700000047683716},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28060001134872437},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C176809094","wikidata":"https://www.wikidata.org/wiki/Q15401496","display_name":"Traverse","level":2,"score":0.2761000096797943},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.272599995136261},{"id":"https://openalex.org/C99138194","wikidata":"https://www.wikidata.org/wiki/Q183427","display_name":"Hash function","level":2,"score":0.2587999999523163},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.2549999952316284}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.23286","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.23286","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.23286","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.23286","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"score":0.657255232334137,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Real-world":[0],"Table-Text":[1,74],"question":[2],"answering":[3],"(QA)":[4],"tasks":[5],"require":[6],"models":[7,204,238],"that":[8,43,70,135,142,163,205],"can":[9],"reason":[10],"across":[11,197],"long":[12],"text":[13,198],"and":[14,20,35,39,141,168,193,199,236],"source":[15,102],"tables,":[16],"traversing":[17],"multiple":[18],"hops":[19,49],"executing":[21],"complex":[22],"operations":[23,58],"such":[24],"as":[25],"aggregation.":[26],"Yet":[27],"existing":[28],"benchmarks":[29,76],"are":[30,109,239],"small,":[31],"manually":[32],"curated":[33],"-":[34,38],"therefore":[36],"error-prone":[37],"contain":[40],"shallow":[41],"questions":[42],"seldom":[44],"demand":[45],"more":[46,220],"than":[47,221],"two":[48,152],"or":[50,54,212],"invoke":[51],"aggregations,":[52,191],"grouping,":[53,192],"other":[55],"advanced":[56],"analytical":[57],"expressible":[59],"in":[60,228],"natural-language":[61],"queries.":[62],"We":[63],"present":[64],"SPARTA,":[65,202],"an":[66],"end-to-end":[67],"construction":[68,234],"framework":[69,92],"automatically":[71,112],"generates":[72],"large-scale":[73],"QA":[75],"with":[77,104],"lightweight":[78],"human":[79],"validation,":[80],"requiring":[81],"only":[82],"one":[83],"quarter":[84],"of":[85,89,125,177,186],"the":[86,115,129,178],"annotation":[87],"time":[88],"HybridQA.":[90],"The":[91,181],"first":[93],"constructs":[94],"a":[95,146,165],"reference":[96],"fact":[97],"database":[98],"by":[99,219],"enriching":[100],"each":[101],"table":[103],"grounding":[105],"tables":[106],"whose":[107,123],"tuples":[108],"atomic":[110],"facts":[111],"extracted":[113],"from":[114],"accompanying":[116],"unstructured":[117],"passages,":[118],"then":[119],"synthesizes":[120],"nested":[121,126],"queries":[122],"number":[124],"predicates":[127],"matches":[128],"desired":[130],"hop":[131],"count.":[132],"To":[133],"ensure":[134],"every":[136],"SQL":[137],"statement":[138],"is":[139],"executable":[140],"its":[143],"verbalization":[144],"yields":[145],"fluent,":[147],"human-sounding":[148],"question,":[149],"we":[150],"propose":[151],"novel":[153],"techniques:":[154],"provenance-based":[155],"refinement,":[156],"which":[157,171],"rewrites":[158],"any":[159],"syntactically":[160],"valid":[161],"query":[162,179],"returns":[164],"non-empty":[166],"result,":[167],"realistic-structure":[169],"enforcement,":[170],"confines":[172],"generation":[173],"to":[174],"post-order":[175],"traversals":[176],"graph.":[180],"resulting":[182],"pipeline":[183],"produces":[184],"thousands":[185],"high-fidelity":[187],"question-answer":[188],"pairs":[189],"covering":[190],"deep":[194],"multi-hop":[195],"reasoning":[196],"tables.":[200],"On":[201],"state-of-the-art":[203],"reach":[206],"over":[207,213],"70":[208],"F1":[209,215,223],"on":[210,216],"HybridQA":[211],"50":[214],"OTT-QA":[217],"drop":[218],"30":[222],"points,":[224],"exposing":[225],"fundamental":[226],"weaknesses":[227],"current":[229],"cross-modal":[230],"reasoning.":[231],"Our":[232],"benchmark,":[233],"code,":[235],"baseline":[237],"available":[240],"at":[241],"https://github.com/pshlego/SPARTA/tree/main.":[242]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-28T00:00:00"}
