{"id":"https://openalex.org/W7162454131","doi":"https://doi.org/10.1145/3788853.3803099","title":"ConDABench: Interactive Evaluation of Language Models for Data Analysis","display_name":"ConDABench: Interactive Evaluation of Language Models for Data Analysis","publication_year":2026,"publication_date":"2026-05-26","ids":{"openalex":"https://openalex.org/W7162454131","doi":"https://doi.org/10.1145/3788853.3803099"},"language":null,"primary_location":{"id":"doi:10.1145/3788853.3803099","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3788853.3803099","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion of the International Conference on Management of Data","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3788853.3803099","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104212959","display_name":"Avik Dutta","orcid":null},"institutions":[{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Avik Dutta","raw_affiliation_strings":["Microsoft, Bangalore, India"],"raw_orcid":"https://orcid.org/0000-0002-7939-0157","affiliations":[{"raw_affiliation_string":"Microsoft, Bangalore, India","institution_ids":["https://openalex.org/I4210124949"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107243985","display_name":"Priyanshu Gupta","orcid":"https://orcid.org/0000-0002-5599-5004"},"institutions":[{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Priyanshu Gupta","raw_affiliation_strings":["Microsoft, Bangalore, India"],"raw_orcid":"https://orcid.org/0000-0002-5599-5004","affiliations":[{"raw_affiliation_string":"Microsoft, Bangalore, India","institution_ids":["https://openalex.org/I4210124949"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033668003","display_name":"Hosein Hasanbeig","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hosein Hasanbeig","raw_affiliation_strings":["Microsoft, Redmond, USA"],"raw_orcid":"https://orcid.org/0000-0002-1715-9830","affiliations":[{"raw_affiliation_string":"Microsoft, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137013447","display_name":"Rahul Pratap Singh","orcid":"https://orcid.org/0009-0005-5829-0797"},"institutions":[{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Rahul Pratap Singh","raw_affiliation_strings":["Microsoft, Bangalore, India"],"raw_orcid":"https://orcid.org/0009-0005-5829-0797","affiliations":[{"raw_affiliation_string":"Microsoft, Bangalore, India","institution_ids":["https://openalex.org/I4210124949"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007975543","display_name":"Harshit Nigam","orcid":"https://orcid.org/0000-0001-7228-5429"},"institutions":[{"id":"https://openalex.org/I4210124949","display_name":"Microsoft Research (India)","ror":"https://ror.org/02w7f3w92","country_code":"IN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210124949"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Harshit Nigam","raw_affiliation_strings":["Microsoft, Bangalore, India"],"raw_orcid":"https://orcid.org/0009-0001-0962-3779","affiliations":[{"raw_affiliation_string":"Microsoft, Bangalore, India","institution_ids":["https://openalex.org/I4210124949"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011543162","display_name":"Sumit Gulwani","orcid":"https://orcid.org/0000-0002-9226-9634"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sumit Gulwani","raw_affiliation_strings":["Microsoft, Redmond, USA"],"raw_orcid":"https://orcid.org/0000-0002-9226-9634","affiliations":[{"raw_affiliation_string":"Microsoft, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000188805","display_name":"Arjun Radhakrishna","orcid":"https://orcid.org/0000-0002-5559-5932"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Arjun Radhakrishna","raw_affiliation_strings":["Microsoft, Redmond, USA"],"raw_orcid":"https://orcid.org/0000-0002-5559-5932","affiliations":[{"raw_affiliation_string":"Microsoft, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137043633","display_name":"Gustavo Soares","orcid":"https://orcid.org/0000-0002-8061-9000"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gustavo Soares","raw_affiliation_strings":["Microsoft, Redmond, USA"],"raw_orcid":"https://orcid.org/0000-0002-8061-9000","affiliations":[{"raw_affiliation_string":"Microsoft, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5137050774","display_name":"Ashish Tiwari","orcid":"https://orcid.org/0000-0002-5153-2686"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ashish Tiwari","raw_affiliation_strings":["Microsoft, Redmond, USA"],"raw_orcid":"https://orcid.org/0000-0002-5153-2686","affiliations":[{"raw_affiliation_string":"Microsoft, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.84676136,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"281","last_page":"292"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.10920000076293945,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.10920000076293945,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.09619999676942825,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.09300000220537186,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.32269999384880066},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3215999901294708},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.30559998750686646},{"id":"https://openalex.org/keywords/modeling-language","display_name":"Modeling language","score":0.2791999876499176},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.2720000147819519}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6855999827384949},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.44020000100135803},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43220001459121704},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.32269999384880066},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3215999901294708},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.30559998750686646},{"id":"https://openalex.org/C179603123","wikidata":"https://www.wikidata.org/wiki/Q1941921","display_name":"Modeling language","level":3,"score":0.2791999876499176},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2720000147819519},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.26919999718666077},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.26019999384880066}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3788853.3803099","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3788853.3803099","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion of the International Conference on Management of Data","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3788853.3803099","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3788853.3803099","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion of the International Conference on Management of Data","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.4247643053531647,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2099684934","https://openalex.org/W2108598243","https://openalex.org/W3156669901","https://openalex.org/W4210451781","https://openalex.org/W4324373918","https://openalex.org/W4386321380","https://openalex.org/W4389519254","https://openalex.org/W4400484844","https://openalex.org/W4402671584","https://openalex.org/W4402672009","https://openalex.org/W4402684077","https://openalex.org/W4404782852","https://openalex.org/W4404783547"],"related_works":[],"abstract_inverted_index":{"Real-world":[0],"data":[1,37,59,115],"analysis":[2,38,60,116],"tasks":[3,39,151],"often":[4],"come":[5],"with":[6],"under-specified":[7],"goals":[8],"and":[9,18,23,63,98],"unclean":[10],"data.":[11],"User":[12],"interaction":[13],"is":[14,158],"necessary":[15],"to":[16,26,111,164],"understand":[17],"disambiguate":[19],"a":[20,54,75],"user's":[21],"intent,":[22],"hence,":[24],"essential":[25],"solving":[27,141,150],"these":[28,43],"complex":[29,174],"tasks.":[30,176],"Existing":[31],"benchmarks":[32,62,81,129],"for":[33,49,56,78,104,161],"evaluating":[34,64],"LLMs":[35,126],"on":[36,67,118,127],"do":[40],"not":[41,146],"capture":[42],"complexities":[44],"or":[45],"provide":[46],"first-class":[47],"support":[48],"interactivity.":[50],"We":[51],"introduce":[52],"ConDABench,":[53],"framework":[55],"generating":[57,79],"conversational":[58,114],"(ConDA)":[61],"external":[65],"tools":[66,117],"the":[68,105,119,128,133],"generated":[69,94,120],"benchmarks.":[70],"ConDABench":[71,157],"consists":[72],"of":[73,124,136],"(a)":[74],"multi-agent":[76],"workflow":[77],"realistic":[80],"from":[82,87],"articles":[83],"describing":[84],"insights":[85],"gained":[86],"public":[88],"datasets,":[89],"(b)":[90],"1,420":[91],"ConDA":[92,121],"problems":[93],"using":[95],"this":[96],"workflow,":[97],"(c)":[99],"an":[100,159],"evaluation":[101],"harness":[102],"that,":[103],"first":[106],"time,":[107],"makes":[108],"it":[109],"possible":[110],"systematically":[112],"evaluate":[113],"problems.":[122],"Evaluation":[123],"state-of-the-art":[125],"reveals":[130],"that":[131,152,171],"while":[132],"new":[134],"generation":[135],"models":[137,170],"are":[138,145],"better":[139,148],"at":[140,149],"more":[142],"instances,":[143],"they":[144],"necessarily":[147],"require":[153],"sustained,":[154],"long-form":[155],"engagement.":[156],"avenue":[160],"model":[162],"builders":[163],"measure":[165],"progress":[166],"towards":[167],"truly":[168],"collaborative":[169],"can":[172],"complete":[173],"interactive":[175]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-27T00:00:00"}
