{"id":"https://openalex.org/W7131894664","doi":"https://doi.org/10.48550/arxiv.2602.22216","title":"Retrieval-Augmented Generation Assistant for Anatomical Pathology Laboratories","display_name":"Retrieval-Augmented Generation Assistant for Anatomical Pathology Laboratories","publication_year":2025,"publication_date":"2025-12-08","ids":{"openalex":"https://openalex.org/W7131894664","doi":"https://doi.org/10.48550/arxiv.2602.22216"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.22216","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.22216","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.22216","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108966975","display_name":"Diogo Pires","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pires, Diogo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114312941","display_name":"Yuriy Perezhohin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Perezhohin, Yuriy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5127445346","display_name":"Mauro Castelli","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Castelli, Mauro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.4693000018596649,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.4693000018596649,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1103999987244606,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.0957999974489212,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.8090000152587891},{"id":"https://openalex.org/keywords/documentation","display_name":"Documentation","score":0.6841999888420105},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5658000111579895},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.5189999938011169},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.4375999867916107},{"id":"https://openalex.org/keywords/health-care","display_name":"Health care","score":0.35370001196861267},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.34049999713897705}],"concepts":[{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.8090000152587891},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6873999834060669},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.6841999888420105},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5658000111579895},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.5189999938011169},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.446399986743927},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.4375999867916107},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4196999967098236},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3716000020503998},{"id":"https://openalex.org/C160735492","wikidata":"https://www.wikidata.org/wiki/Q31207","display_name":"Health care","level":2,"score":0.35370001196861267},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.34049999713897705},{"id":"https://openalex.org/C203357204","wikidata":"https://www.wikidata.org/wiki/Q1089605","display_name":"Chunking (psychology)","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.3122999966144562},{"id":"https://openalex.org/C136886441","wikidata":"https://www.wikidata.org/wiki/Q926129","display_name":"Normalization (sociology)","level":2,"score":0.3093999922275543},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.3027999997138977},{"id":"https://openalex.org/C110615152","wikidata":"https://www.wikidata.org/wiki/Q1469824","display_name":"Controlled vocabulary","level":2,"score":0.27889999747276306},{"id":"https://openalex.org/C19527891","wikidata":"https://www.wikidata.org/wiki/Q1120908","display_name":"Medical physics","level":1,"score":0.2777999937534332},{"id":"https://openalex.org/C3020144179","wikidata":"https://www.wikidata.org/wiki/Q10871684","display_name":"Electronic health record","level":3,"score":0.27559998631477356},{"id":"https://openalex.org/C2780932742","wikidata":"https://www.wikidata.org/wiki/Q4915239","display_name":"Biorepository","level":3,"score":0.274399995803833},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.2549000084400177},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2517000138759613}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.22216","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.22216","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.22216","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.22216","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Accurate":[0],"and":[1,37,46,52,87,104,128,149,171,192,210],"efficient":[2],"access":[3],"to":[4,15,39,60,64,70,196],"laboratory":[5,22,207],"protocols":[6,81],"is":[7,33],"essential":[8],"in":[9,190],"Anatomical":[10],"Pathology":[11],"(AP),":[12],"where":[13],"up":[14],"70%":[16],"of":[17,43,78,156,177],"medical":[18],"decisions":[19],"depend":[20],"on":[21],"diagnoses.":[23],"However,":[24],"static":[25,198],"documentation":[26,199],"such":[27],"as":[28],"printed":[29],"manuals":[30],"or":[31],"PDFs":[32],"often":[34],"outdated,":[35],"fragmented,":[36],"difficult":[38],"search,":[40],"creating":[41],"risks":[42],"workflow":[44,208],"errors":[45],"diagnostic":[47],"delays.":[48],"This":[49],"study":[50],"proposes":[51],"evaluates":[53],"a":[54,75,83,137,164],"Retrieval-Augmented":[55],"Generation":[56],"(RAG)":[57],"assistant":[58],"tailored":[59],"AP":[61,80,178],"laboratories,":[62],"designed":[63],"provide":[65],"technicians":[66],"with":[67],"context-grounded":[68],"answers":[69],"protocol-related":[71],"queries.":[72],"We":[73],"curated":[74],"novel":[76],"corpus":[77],"99":[79],"from":[82],"Portuguese":[84],"healthcare":[85,191],"institution":[86],"constructed":[88],"323":[89],"question-answer":[90],"pairs":[91],"for":[92,186],"systematic":[93],"evaluation.":[94],"Ten":[95],"experiments":[96],"were":[97],"conducted,":[98],"varying":[99],"chunking":[100,127],"strategies,":[101],"retrieval":[102,121,130],"methods,":[103],"embedding":[105,139],"models.":[106],"Performance":[107],"was":[108],"assessed":[109],"using":[110],"the":[111,132,154,174],"RAGAS":[112],"framework":[113],"(faithfulness,":[114],"answer":[115,144],"relevance,":[116],"context":[117,150],"recall)":[118],"alongside":[119],"top-k":[120],"metrics.":[122],"Results":[123],"show":[124],"that":[125,162],"recursive":[126],"hybrid":[129],"delivered":[131],"strongest":[133],"baseline":[134],"performance.":[135],"Incorporating":[136],"biomedical-specific":[138],"model":[140],"(MedEmbed)":[141],"further":[142],"improved":[143],"relevance":[145],"(0.74),":[146],"faithfulness":[147],"(0.70),":[148],"recall":[151],"(0.77),":[152],"showing":[153],"importance":[155],"domain-specialised":[157],"embeddings.":[158],"Top-k":[159],"analysis":[160],"revealed":[161],"retrieving":[163],"single":[165],"top-ranked":[166],"chunk":[167],"(k=1)":[168],"maximized":[169],"efficiency":[170,209],"accuracy,":[172],"reflecting":[173],"modular":[175],"structure":[176],"protocols.":[179],"These":[180],"findings":[181],"highlight":[182],"critical":[183],"design":[184],"considerations":[185],"deploying":[187],"RAG":[188],"systems":[189],"demonstrate":[193],"their":[194],"potential":[195],"transform":[197],"into":[200],"dynamic,":[201],"reliable":[202],"knowledge":[203],"assistants,":[204],"thus":[205],"improving":[206],"supporting":[211],"patient":[212],"safety.":[213]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-28T00:00:00"}
