{"id":"https://openalex.org/W7155183294","doi":"https://doi.org/10.48550/arxiv.2604.18805","title":"AI scientists produce results without reasoning scientifically","display_name":"AI scientists produce results without reasoning scientifically","publication_year":2026,"publication_date":"2026-04-20","ids":{"openalex":"https://openalex.org/W7155183294","doi":"https://doi.org/10.48550/arxiv.2604.18805"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.18805","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18805","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.18805","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134310068","display_name":"Marti\u00f1o R\u00edos-Garc\u00eda","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"R\u00edos-Garc\u00eda, Marti\u00f1o","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134358686","display_name":"Nawaf Alampara","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alampara, Nawaf","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134304276","display_name":"Chandan Gupta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gupta, Chandan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006744528","display_name":"Indrajeet Mandal","orcid":"https://orcid.org/0000-0002-8808-4602"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mandal, Indrajeet","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051593420","display_name":"Sajid Mannan","orcid":"https://orcid.org/0000-0002-7887-2250"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mannan, Sajid","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134297591","display_name":"Ali Asghar Aghajani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aghajani, Ali Asghar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134267240","display_name":"N. M. Anoop Krishnan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Krishnan, N. M. Anoop","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134249392","display_name":"Kevin Maik Jablonka","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jablonka, Kevin Maik","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.20080000162124634,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.20080000162124634,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.13650000095367432,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.10859999805688858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.7720999717712402},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5228999853134155},{"id":"https://openalex.org/keywords/scientific-reasoning","display_name":"Scientific reasoning","score":0.474700003862381},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.45210000872612},{"id":"https://openalex.org/keywords/model-based-reasoning","display_name":"Model-based reasoning","score":0.39320001006126404},{"id":"https://openalex.org/keywords/scientific-discovery","display_name":"Scientific discovery","score":0.37770000100135803},{"id":"https://openalex.org/keywords/base","display_name":"Base (topology)","score":0.3743000030517578},{"id":"https://openalex.org/keywords/causal-reasoning","display_name":"Causal reasoning","score":0.36039999127388}],"concepts":[{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.7720999717712402},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6093000173568726},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5228999853134155},{"id":"https://openalex.org/C2992562121","wikidata":"https://www.wikidata.org/wiki/Q3817808","display_name":"Scientific reasoning","level":2,"score":0.474700003862381},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.46619999408721924},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.45210000872612},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41280001401901245},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.39320001006126404},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3783000111579895},{"id":"https://openalex.org/C2984917352","wikidata":"https://www.wikidata.org/wiki/Q12772819","display_name":"Scientific discovery","level":2,"score":0.37770000100135803},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.3743000030517578},{"id":"https://openalex.org/C115086926","wikidata":"https://www.wikidata.org/wiki/Q17004651","display_name":"Causal reasoning","level":3,"score":0.36039999127388},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.34529998898506165},{"id":"https://openalex.org/C195732255","wikidata":"https://www.wikidata.org/wiki/Q981008","display_name":"Sociology of scientific knowledge","level":2,"score":0.3395000100135803},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.3246000111103058},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.3176000118255615},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.3077000081539154},{"id":"https://openalex.org/C138379479","wikidata":"https://www.wikidata.org/wiki/Q1116876","display_name":"Scientific modelling","level":2,"score":0.2892000079154968},{"id":"https://openalex.org/C110099512","wikidata":"https://www.wikidata.org/wiki/Q59115","display_name":"Philosophy of science","level":2,"score":0.2842000126838684},{"id":"https://openalex.org/C2781083858","wikidata":"https://www.wikidata.org/wiki/Q17327049","display_name":"Scientific literature","level":2,"score":0.2766000032424927},{"id":"https://openalex.org/C124056412","wikidata":"https://www.wikidata.org/wiki/Q3320364","display_name":"Scientific evidence","level":2,"score":0.27239999175071716},{"id":"https://openalex.org/C108650721","wikidata":"https://www.wikidata.org/wiki/Q1783253","display_name":"Counterfactual thinking","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C159032336","wikidata":"https://www.wikidata.org/wiki/Q2488768","display_name":"Non-monotonic logic","level":2,"score":0.2639000117778778},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.2540999948978424},{"id":"https://openalex.org/C116222747","wikidata":"https://www.wikidata.org/wiki/Q220888","display_name":"Falsifiability","level":2,"score":0.2540000081062317},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.18805","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18805","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.18805","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18805","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"model":[2,67,89],"(LLM)-based":[3],"systems":[4],"are":[5],"increasingly":[6],"deployed":[7],"to":[8,18,42],"conduct":[9],"scientific":[10,24,34,177,188,211],"research":[11],"autonomously,":[12],"yet":[13],"whether":[14,137],"their":[15],"reasoning":[16,134,156,204],"adheres":[17],"the":[19,62,65,69,78,87,91,108,138,161,183,210,221],"epistemic":[20,184],"norms":[21],"that":[22,60,86,186,223],"make":[23],"inquiry":[25],"self-correcting":[26],"is":[27,90,114,130],"poorly":[28],"understood.":[29],"Here,":[30],"we":[31],"evaluate":[32],"LLM-based":[33,174],"agents":[35,152,175,216],"across":[36,165],"eight":[37],"domains,":[38],"spanning":[39],"workflow":[40,143],"execution":[41],"hypothesis-driven":[43,146],"inquiry,":[44],"through":[45],"more":[46],"than":[47],"25,000":[48],"agent":[49,70,82,139],"runs":[50],"and":[51,68,72,97,126,160,196],"two":[52],"complementary":[53],"lenses:":[54],"(i)":[55],"a":[56,74,141,207],"systematic":[57],"performance":[58,96],"analysis":[59,76],"decomposes":[61],"contributions":[63],"of":[64,77,81,94,102,118],"base":[66,88],"scaffold,":[71],"(ii)":[73],"behavioral":[75],"epistemological":[79],"structure":[80],"reasoning.":[83,189],"We":[84],"observe":[85],"primary":[92],"determinant":[93],"both":[95],"behavior,":[98],"accounting":[99],"for":[100,107],"41.4%":[101],"explained":[103],"variance":[104],"versus":[105],"1.5%":[106],"scaffold.":[109],"Across":[110],"all":[111],"configurations,":[112],"evidence":[113,129],"ignored":[115],"in":[116,124,168],"68%":[117],"traces,":[119],"refutation-driven":[120],"belief":[121],"revision":[122],"occurs":[123],"26%,":[125],"convergent":[127],"multi-test":[128],"rare.":[131],"The":[132],"same":[133],"pattern":[135],"appears":[136],"executes":[140],"computational":[142],"or":[144],"conducts":[145],"inquiry.":[147],"They":[148],"persist":[149],"even":[150],"when":[151],"receive":[153],"near-complete":[154],"successful":[155],"trajectories":[157],"as":[158],"context,":[159],"resulting":[162],"unreliability":[163],"compounds":[164],"repeated":[166],"trials":[167],"epistemically":[169],"demanding":[170],"domains.":[171],"Thus,":[172],"current":[173],"execute":[176],"workflows":[178],"but":[179],"do":[180],"not":[181],"exhibit":[182],"patterns":[185],"characterize":[187],"Outcome-based":[190],"evaluation":[191],"cannot":[192,200,217],"detect":[193],"these":[194],"failures,":[195],"scaffold":[197],"engineering":[198],"alone":[199],"repair":[201],"them.":[202],"Until":[203],"itself":[205],"becomes":[206],"training":[208],"target,":[209],"knowledge":[212],"produced":[213],"by":[214,220],"such":[215],"be":[218],"justified":[219],"process":[222],"generated":[224],"it.":[225]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-23T00:00:00"}
