{"id":"https://openalex.org/W7139965416","doi":"https://doi.org/10.48550/arxiv.2603.19005","title":"AgentDS Technical Report: Benchmarking the Future of Human-AI Collaboration in Domain-Specific Data Science","display_name":"AgentDS Technical Report: Benchmarking the Future of Human-AI Collaboration in Domain-Specific Data Science","publication_year":2026,"publication_date":"2026-03-19","ids":{"openalex":"https://openalex.org/W7139965416","doi":"https://doi.org/10.48550/arxiv.2603.19005"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.19005","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19005","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.19005","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025874786","display_name":"An Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Luo, An","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130215857","display_name":"Jin Du","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Jin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130235065","display_name":"Xun Xian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xian, Xun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080962911","display_name":"Robert Specht","orcid":"https://orcid.org/0000-0002-5949-9577"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Specht, Robert","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113555795","display_name":"Fangqiao Tian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian, Fangqiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082958363","display_name":"Ganghua Wang","orcid":"https://orcid.org/0000-0002-0888-167X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Ganghua","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070768111","display_name":"Xuan Bi","orcid":"https://orcid.org/0000-0002-4683-1411"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bi, Xuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130246076","display_name":"Charles Fleming","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fleming, Charles","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130245220","display_name":"Ashish Kundu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kundu, Ashish","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130236575","display_name":"Jayanth Srinivasa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Srinivasa, Jayanth","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130246015","display_name":"Mingyi Hong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hong, Mingyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130247981","display_name":"Rui Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Rui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077899199","display_name":"Tianxi Li","orcid":"https://orcid.org/0000-0003-4595-1777"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Tianxi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130235517","display_name":"Galin Jones","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jones, Galin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130230700","display_name":"Jie Ding","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ding, Jie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":15,"corresponding_author_ids":["https://openalex.org/A5025874786"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.17430000007152557,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.17430000007152557,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.11749999970197678,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.06520000100135803,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.8479999899864197},{"id":"https://openalex.org/keywords/competition","display_name":"Competition (biology)","score":0.6291000247001648},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5199999809265137},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.517799973487854},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.4088999927043915},{"id":"https://openalex.org/keywords/crowdsourcing","display_name":"Crowdsourcing","score":0.3885999917984009},{"id":"https://openalex.org/keywords/human-intelligence","display_name":"Human intelligence","score":0.3617999851703644},{"id":"https://openalex.org/keywords/applications-of-artificial-intelligence","display_name":"Applications of artificial intelligence","score":0.3375999927520752}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.8479999899864197},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.6477000117301941},{"id":"https://openalex.org/C91306197","wikidata":"https://www.wikidata.org/wiki/Q45767","display_name":"Competition (biology)","level":2,"score":0.6291000247001648},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5418000221252441},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5199999809265137},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.517799973487854},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.4088999927043915},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.3885999917984009},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.3725999891757965},{"id":"https://openalex.org/C105409693","wikidata":"https://www.wikidata.org/wiki/Q5937824","display_name":"Human intelligence","level":2,"score":0.3617999851703644},{"id":"https://openalex.org/C157170001","wikidata":"https://www.wikidata.org/wiki/Q4781507","display_name":"Applications of artificial intelligence","level":2,"score":0.3375999927520752},{"id":"https://openalex.org/C2780535194","wikidata":"https://www.wikidata.org/wiki/Q309901","display_name":"Open data","level":2,"score":0.326200008392334},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.31949999928474426},{"id":"https://openalex.org/C89057211","wikidata":"https://www.wikidata.org/wiki/Q432197","display_name":"Collective intelligence","level":2,"score":0.31439998745918274},{"id":"https://openalex.org/C184356942","wikidata":"https://www.wikidata.org/wiki/Q830382","display_name":"Best practice","level":2,"score":0.3003000020980835},{"id":"https://openalex.org/C196879817","wikidata":"https://www.wikidata.org/wiki/Q872685","display_name":"Data governance","level":4,"score":0.2874999940395355},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.2872999906539917},{"id":"https://openalex.org/C82578977","wikidata":"https://www.wikidata.org/wiki/Q16773055","display_name":"Data aggregator","level":3,"score":0.2865000069141388},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28519999980926514},{"id":"https://openalex.org/C2778149293","wikidata":"https://www.wikidata.org/wiki/Q309823","display_name":"Open science","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.19005","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19005","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.19005","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.19005","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Zero hunger","id":"https://metadata.un.org/sdg/2","score":0.45592668652534485}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Data":[0],"science":[1,32,53],"plays":[2],"a":[3,68],"critical":[4],"role":[5],"in":[6,18,56,82,172],"transforming":[7],"complex":[8],"data":[9,31,52,84,173],"into":[10],"actionable":[11],"insights":[12],"across":[13,91],"numerous":[14],"domains.":[15],"Recent":[16],"developments":[17],"large":[19],"language":[20],"models":[21],"(LLMs)":[22],"and":[23,55,70,78,100,111,121,164,190],"artificial":[24],"intelligence":[25],"(AI)":[26],"agents":[27,42,77,130],"have":[28],"significantly":[29],"automated":[30],"workflow.":[33],"However,":[34],"it":[35],"remains":[36],"unclear":[37],"to":[38,62,73],"what":[39],"extent":[40],"AI":[41,76,129,163],"can":[43],"match":[44],"the":[45,141,147,157,166,179,185],"performance":[46,81],"of":[47,88,143,159,169,182],"human":[48,59,170],"experts":[49],"on":[50],"domain-specific":[51,83,133],"tasks,":[54],"which":[57],"aspects":[58],"expertise":[60,171],"continues":[61],"provide":[63],"advantages.":[64],"We":[65,103],"introduce":[66],"AgentDS,":[67],"benchmark":[69],"competition":[71,107,144],"designed":[72],"evaluate":[74],"both":[75],"human-AI":[79,118,152],"collaboration":[80],"science.":[85],"AgentDS":[86,186],"consists":[87],"17":[89],"challenges":[90],"six":[92],"industries:":[93],"commerce,":[94],"food":[95],"production,":[96],"healthcare,":[97],"insurance,":[98],"manufacturing,":[99],"retail":[101],"banking.":[102],"conducted":[104],"an":[105],"open":[106,191],"involving":[108],"29":[109],"teams":[110],"80":[112],"participants,":[113,145],"enabling":[114],"systematic":[115],"comparison":[116],"between":[117],"collaborative":[119],"approaches":[120],"AI-only":[122,135],"baselines.":[123],"Our":[124],"results":[125],"show":[126],"that":[127],"current":[128],"struggle":[131],"with":[132],"reasoning.":[134],"baselines":[136],"perform":[137],"near":[138],"or":[139],"below":[140],"median":[142],"while":[146,175],"strongest":[148],"solutions":[149],"arise":[150],"from":[151],"collaboration.":[153],"These":[154],"findings":[155],"challenge":[156],"narrative":[158],"complete":[160],"automation":[161],"by":[162],"underscore":[165],"enduring":[167],"importance":[168],"science,":[174],"illuminating":[176],"directions":[177],"for":[178],"next":[180],"generation":[181],"AI.":[183],"Visit":[184],"website":[187],"here:":[188,194],"https://agentds.org/":[189],"source":[192],"datasets":[193],"https://huggingface.co/datasets/lainmn/AgentDS":[195],".":[196]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-03-21T00:00:00"}
