{"id":"https://openalex.org/W7153203263","doi":"https://doi.org/10.48550/arxiv.2604.07964","title":"Are we still able to recognize pearls? Machine-driven peer review and the risk to creativity: An explainable RAG-XAI detection framework with markers extraction","display_name":"Are we still able to recognize pearls? Machine-driven peer review and the risk to creativity: An explainable RAG-XAI detection framework with markers extraction","publication_year":2026,"publication_date":"2026-04-09","ids":{"openalex":"https://openalex.org/W7153203263","doi":"https://doi.org/10.48550/arxiv.2604.07964"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.07964","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07964","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.07964","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053622442","display_name":"Alin-Gabriel V\u0103duva","orcid":"https://orcid.org/0009-0008-1825-4945"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"V\u0103duva, Alin-Gabriel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121145332","display_name":"Simona-Vasilica Oprea","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oprea, Simona-Vasilica","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133388085","display_name":"Adela B\u00e2ra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"B\u00e2ra, Adela","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.8174999952316284,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.8174999952316284,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.04410000145435333,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10102","display_name":"scientometrics and bibliometrics research","score":0.017100000753998756,"subfield":{"id":"https://openalex.org/subfields/1804","display_name":"Statistics, Probability and Uncertainty"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.47769999504089355},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.47049999237060547},{"id":"https://openalex.org/keywords/accountability","display_name":"Accountability","score":0.42160001397132874},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.41920000314712524},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4025999903678894},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.4004000127315521},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.3880999982357025},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.38659998774528503}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7297999858856201},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.47769999504089355},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.47049999237060547},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46050000190734863},{"id":"https://openalex.org/C2776007630","wikidata":"https://www.wikidata.org/wiki/Q2798912","display_name":"Accountability","level":2,"score":0.42160001397132874},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.41920000314712524},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40849998593330383},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4025999903678894},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.4004000127315521},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3917999863624573},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.3880999982357025},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.38659998774528503},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.3522000014781952},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.33320000767707825},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.31299999356269836},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.30970001220703125},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.29919999837875366},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.295199990272522},{"id":"https://openalex.org/C151956035","wikidata":"https://www.wikidata.org/wiki/Q1132755","display_name":"Logistic regression","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.2847000062465668},{"id":"https://openalex.org/C2776141515","wikidata":"https://www.wikidata.org/wiki/Q1274479","display_name":"Repetition (rhetorical device)","level":2,"score":0.28130000829696655},{"id":"https://openalex.org/C22607594","wikidata":"https://www.wikidata.org/wiki/Q5375150","display_name":"Enabling","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.2624000012874603},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.259799987077713},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2565999925136566}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.07964","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07964","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.07964","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07964","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0,144],"integration":[1],"of":[2,21,165,204,235],"large":[3],"language":[4],"models":[5],"(LLMs)":[6],"into":[7],"peer":[8],"review":[9,125],"raises":[10],"a":[11,48],"concern":[12],"beyond":[13],"authorship":[14],"and":[15,79,127,140,155,163,179,199,207],"detection:":[16],"the":[17,22,56,168,186,211,215,228,233,236],"potential":[18],"cascading":[19],"automation":[20],"entire":[23],"editorial":[24,37],"process.":[25],"As":[26],"reviews":[27],"become":[28],"partially":[29],"or":[30],"fully":[31,49],"machine-generated,":[32],"it":[33],"becomes":[34],"plausible":[35],"that":[36,67,82,89],"decisions":[38],"may":[39,70],"also":[40],"be":[41],"delegated":[42],"to":[43,47,94,102,136],"algorithmic":[44,107],"systems,":[45],"leading":[46],"automated":[50,129],"evaluation":[51],"pipeline.":[52],"They":[53],"risk":[54],"reshaping":[55],"criteria":[57],"by":[58],"which":[59],"scientific":[60],"work":[61,105],"is":[62],"assessed.":[63],"This":[64],"paper":[65],"argues":[66],"machine-driven":[68],"assessment":[69],"systematically":[71],"favor":[72],"standardized,":[73],"pattern-conforming":[74],"research":[75],"while":[76,171],"penalizing":[77],"unconventional":[78],"paradigm-shifting":[80],"ideas":[81],"require":[83],"contextual":[84],"human":[85],"judgment.":[86],"We":[87],"consider":[88],"this":[90,115],"shift":[91],"could":[92],"lead":[93],"epistemic":[95],"homogenization,":[96],"where":[97],"researchers":[98],"are":[99],"implicitly":[100],"incentivized":[101],"optimize":[103],"their":[104],"for":[106,123],"approval":[108],"rather":[109],"than":[110],"genuine":[111],"discovery.":[112],"To":[113],"address":[114],"risk,":[116],"we":[117],"introduce":[118],"an":[119],"explainable":[120],"framework":[121,146],"(RAG-XAI)":[122],"assessing":[124],"quality":[126],"detecting":[128],"patterns":[130,209],"using":[131],"markers":[132],"LLM":[133],"extractor,":[134],"aiming":[135],"preserve":[137],"transparency,":[138],"accountability":[139],"creativity":[141],"in":[142,227],"science.":[143],"proposed":[145],"achieves":[147,218],"near-perfect":[148],"detection":[149],"performance,":[150],"with":[151,223],"XGBoost,":[152],"Random":[153],"Forest":[154],"LightGBM":[156],"reaching":[157],"99.61%":[158],"accuracy,":[159,194,222],"AUC-ROC":[160],"above":[161],"0.999":[162],"F1-scores":[164],"0.9925":[166],"on":[167],"test":[169],"set,":[170],"maintaining":[172],"extremely":[173],"low":[174],"false":[175,180],"positive":[176],"rates":[177,182],"(&lt;0.23%)":[178],"negative":[181],"(~0.8%).":[183],"In":[184],"contrast,":[185],"logistic":[187],"regression":[188],"baseline":[189],"performs":[190],"substantially":[191],"worse":[192],"(89.97%":[193],"F1-score":[195],"0.8314).":[196],"Feature":[197],"importance":[198],"SHAP":[200],"analyses":[201],"identify":[202],"absence":[203],"personal":[205],"signals":[206],"repetition":[208],"as":[210],"dominant":[212],"predictors.":[213],"Additionally,":[214],"RAG":[216],"component":[217],"90.5%":[219],"top-1":[220],"retrieval":[221],"strong":[224],"same-class":[225],"clustering":[226],"embedding":[229],"space,":[230],"further":[231],"supporting":[232],"reliability":[234],"framework's":[237],"outputs.":[238]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-11T00:00:00"}
