{"id":"https://openalex.org/W7162579366","doi":"https://doi.org/10.48550/arxiv.2605.26340","title":"ScientistOne: Towards Human-Level Autonomous Research via Chain-of-Evidence","display_name":"ScientistOne: Towards Human-Level Autonomous Research via Chain-of-Evidence","publication_year":2026,"publication_date":"2026-05-25","ids":{"openalex":"https://openalex.org/W7162579366","doi":"https://doi.org/10.48550/arxiv.2605.26340"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.26340","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26340","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.26340","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137179080","display_name":"Rui Meng","orcid":"https://orcid.org/0000-0002-6562-4012"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Meng, Rui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137151069","display_name":"Bhavana Dalvi Mishra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mishra, Bhavana Dalvi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137128643","display_name":"Jiefeng Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Jiefeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102972645","display_name":"Chunliang Li","orcid":"https://orcid.org/0000-0002-5938-5510"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Chun-Liang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011797382","display_name":"Palash Goyal","orcid":"https://orcid.org/0000-0003-2455-2160"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goyal, Palash","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137163005","display_name":"Mihir Parmar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parmar, Mihir","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137185322","display_name":"Yiwen Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Yiwen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100566791","display_name":"Yale Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Yale","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087918973","display_name":"Rajarishi Sinha","orcid":"https://orcid.org/0000-0001-9157-674X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sinha, Rajarishi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137150783","display_name":"Parthasarathy Ranganathan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ranganathan, Parthasarathy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103372430","display_name":"Burak G\u00f6kt\u00fcrk","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gokturk, Burak","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137087284","display_name":"Jinsung Yoon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yoon, Jinsung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137169530","display_name":"Tomas Pfister","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pfister, Tomas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.3529999852180481,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.3529999852180481,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.1128000020980835,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.08420000225305557,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hallucinating","display_name":"Hallucinating","score":0.7998999953269958},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.6294000148773193},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.5401999950408936},{"id":"https://openalex.org/keywords/audit","display_name":"Audit","score":0.5360999703407288},{"id":"https://openalex.org/keywords/collusion","display_name":"Collusion","score":0.43810001015663147},{"id":"https://openalex.org/keywords/artifact","display_name":"Artifact (error)","score":0.3269999921321869}],"concepts":[{"id":"https://openalex.org/C2911011789","wikidata":"https://www.wikidata.org/wiki/Q130741","display_name":"Hallucinating","level":2,"score":0.7998999953269958},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.6294000148773193},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5924999713897705},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.5401999950408936},{"id":"https://openalex.org/C199521495","wikidata":"https://www.wikidata.org/wiki/Q181487","display_name":"Audit","level":2,"score":0.5360999703407288},{"id":"https://openalex.org/C2781198186","wikidata":"https://www.wikidata.org/wiki/Q701521","display_name":"Collusion","level":2,"score":0.43810001015663147},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4205000102519989},{"id":"https://openalex.org/C2779010991","wikidata":"https://www.wikidata.org/wiki/Q2720909","display_name":"Artifact (error)","level":2,"score":0.3269999921321869},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.31690001487731934},{"id":"https://openalex.org/C106347477","wikidata":"https://www.wikidata.org/wiki/Q5384228","display_name":"Equating","level":3,"score":0.303600013256073},{"id":"https://openalex.org/C2778869765","wikidata":"https://www.wikidata.org/wiki/Q6028363","display_name":"Inefficiency","level":2,"score":0.2906999886035919},{"id":"https://openalex.org/C2780813799","wikidata":"https://www.wikidata.org/wiki/Q3274237","display_name":"Zero (linguistics)","level":2,"score":0.271699994802475},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.26340","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26340","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.26340","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26340","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.4904002547264099,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Autonomous":[0],"research":[1,58,109],"agents":[2],"produce":[3],"competitive":[4],"solutions":[5],"and":[6,23,71,91,106,135,153,184,192],"professional-looking":[7],"manuscripts,":[8],"yet":[9],"their":[10],"outputs":[11],"contain":[12],"verifiability":[13,41],"failures":[14],"undetectable":[15],"by":[16,64],"surface-level":[17],"evaluation:":[18],"fabricated":[19],"citations,":[20],"unreproducible":[21],"scores,":[22],"method":[24],"descriptions":[25],"that":[26,60],"diverge":[27],"from":[28,139],"the":[29,154],"implementation.":[30],"We":[31],"address":[32],"this":[33],"through":[34],"three":[35],"contributions.":[36],"First,":[37],"Chain-of-Evidence":[38],"(CoE),":[39],"a":[40,77],"framework":[42],"requiring":[43],"every":[44,111],"claim":[45],"to":[46,49,97,141,173],"be":[47],"traceable":[48],"its":[50],"evidence":[51,62],"source.":[52],"Second,":[53],"ScientistOne,":[54],"an":[55],"end-to-end":[56],"autonomous":[57],"system":[59],"maintains":[61],"chains":[63],"construction":[65],"throughout":[66],"literature":[67],"review,":[68],"solution":[69],"discovery,":[70],"paper":[72],"writing.":[73],"Third,":[74],"CoE":[75],"Audit,":[76],"post-hoc":[78],"audit":[79],"whose":[80],"four":[81],"integrity":[82],"checks":[83],"--":[84,94],"score":[85,125,150],"verification,":[86,90],"specification":[87],"violation,":[88],"reference":[89,121],"method-code":[92,136,156],"alignment":[93,137,157],"apply":[95],"uniformly":[96],"all":[98,167],"systems.":[99],"Across":[100],"75":[101],"papers":[102],"spanning":[103,177],"five":[104,107,168],"systems":[105],"frontier":[108],"tasks,":[110],"baseline":[112],"exhibits":[113],"at":[114],"least":[115],"one":[116],"systematic":[117],"failure":[118],"mode:":[119],"hallucinated":[120,146],"rates":[122],"reach":[123],"21%,":[124],"verification":[126,151],"passes":[127],"in":[128],"as":[129,131],"few":[130],"42%":[132],"of":[133],"papers,":[134],"ranges":[138],"20%":[140],"80%.":[142],"ScientistOne":[143,170],"achieves":[144],"zero":[145],"references":[147],"(0/337),":[148],"perfect":[149],"(12/12),":[152],"highest":[155],"(14/15),":[158],"while":[159],"matching":[160],"or":[161],"exceeding":[162],"human":[163],"expert":[164],"performance":[165],"on":[166,189,195],"tasks.":[169],"further":[171],"generalizes":[172],"six":[174],"additional":[175],"tasks":[176,197],"medical":[178],"imaging,":[179],"fine-grained":[180],"recognition,":[181],"3D":[182],"perception,":[183],"language":[185],"modeling,":[186],"achieving":[187],"state-of-the-art":[188],"Parameter":[190],"Golf":[191],"gold":[193],"medals":[194],"MLE-Bench":[196],"where":[198],"baselines":[199],"fail":[200],"entirely.":[201]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-28T00:00:00"}
