{"id":"https://openalex.org/W4380136794","doi":"https://doi.org/10.48550/arxiv.2306.05323","title":"Advancing Italian Biomedical Information Extraction with Transformers-based Models: Methodological Insights and Multicenter Practical Application","display_name":"Advancing Italian Biomedical Information Extraction with Transformers-based Models: Methodological Insights and Multicenter Practical Application","publication_year":2023,"publication_date":"2023-06-08","ids":{"openalex":"https://openalex.org/W4380136794","doi":"https://doi.org/10.48550/arxiv.2306.05323"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2306.05323","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.05323","pdf_url":"https://arxiv.org/pdf/2306.05323","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2306.05323","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084685551","display_name":"Claudio Crema","orcid":"https://orcid.org/0000-0003-2537-9742"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Crema, Claudio","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046058191","display_name":"Tommaso Mario Buonocore","orcid":"https://orcid.org/0000-0002-2887-088X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Buonocore, Tommaso Mario","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031124669","display_name":"Silvia Fostinelli","orcid":"https://orcid.org/0000-0003-0120-880X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fostinelli, Silvia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090028219","display_name":"Enea Parimbelli","orcid":"https://orcid.org/0000-0003-0679-828X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Parimbelli, Enea","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066201036","display_name":"Federico Verde","orcid":"https://orcid.org/0000-0002-3977-6995"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Verde, Federico","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078256498","display_name":"Cira Fundar\u00f2","orcid":"https://orcid.org/0000-0002-7810-8885"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fundar\u00f2, Cira","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003077658","display_name":"Marina Manera","orcid":"https://orcid.org/0000-0003-4235-9612"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manera, Marina","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086608723","display_name":"Matteo Cotta Ramusino","orcid":"https://orcid.org/0000-0003-3090-9648"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramusino, Matteo Cotta","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055240477","display_name":"Marco Capelli","orcid":"https://orcid.org/0000-0002-4454-366X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Capelli, Marco","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014884119","display_name":"Alfredo Costa","orcid":"https://orcid.org/0000-0001-7312-8011"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Costa, Alfredo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062561725","display_name":"Giuliano Binetti","orcid":"https://orcid.org/0000-0003-2759-5844"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Binetti, Giuliano","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050932220","display_name":"Riccardo Bellazzi","orcid":"https://orcid.org/0000-0002-6974-9808"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bellazzi, Riccardo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5073183618","display_name":"Alberto Redolfi","orcid":"https://orcid.org/0000-0002-4145-9059"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Redolfi, Alberto","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5084685551"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9663000106811523,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7679286003112793},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.7047730684280396},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5436550378799438},{"id":"https://openalex.org/keywords/recall","display_name":"Recall","score":0.5323565006256104},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.49714186787605286},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4898986220359802},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.47089818120002747},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.4668341875076294},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.4478399455547333},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.44176262617111206},{"id":"https://openalex.org/keywords/medical-record","display_name":"Medical record","score":0.41102567315101624},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4053837060928345},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.11948546767234802},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.10059782862663269}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7679286003112793},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.7047730684280396},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5436550378799438},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.5323565006256104},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.49714186787605286},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4898986220359802},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.47089818120002747},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.4668341875076294},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4478399455547333},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.44176262617111206},{"id":"https://openalex.org/C195910791","wikidata":"https://www.wikidata.org/wiki/Q1324077","display_name":"Medical record","level":2,"score":0.41102567315101624},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4053837060928345},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.11948546767234802},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.10059782862663269},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2306.05323","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.05323","pdf_url":"https://arxiv.org/pdf/2306.05323","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2306.05323","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2306.05323","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2306.05323","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2306.05323","pdf_url":"https://arxiv.org/pdf/2306.05323","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8299999833106995}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4380136794.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2358294942","https://openalex.org/W2405355225","https://openalex.org/W4367460280","https://openalex.org/W2004087619","https://openalex.org/W4321472216","https://openalex.org/W2557094866","https://openalex.org/W2469016277","https://openalex.org/W2362196274","https://openalex.org/W2757101400","https://openalex.org/W2165504147"],"abstract_inverted_index":{"The":[0,107],"introduction":[1],"of":[2,46,115],"computerized":[3],"medical":[4,23,36],"records":[5,24,37],"in":[6,22,149],"hospitals":[7],"has":[8],"reduced":[9],"burdensome":[10],"activities":[11],"like":[12],"manual":[13],"writing":[14],"and":[15,40,76,87,120],"information":[16],"fetching.":[17],"However,":[18],"the":[19,67,112,142],"data":[20,32],"contained":[21],"are":[25],"still":[26],"far":[27],"underutilized,":[28],"primarily":[29],"because":[30],"extracting":[31],"from":[33],"unstructured":[34],"textual":[35],"takes":[38],"time":[39],"effort.":[41],"Information":[42],"Extraction,":[43],"a":[44,81,116,122,130],"subfield":[45],"Natural":[47,145],"Language":[48,146],"Processing,":[49],"can":[50],"help":[51],"clinical":[52],"practitioners":[53],"overcome":[54],"this":[55,63],"limitation":[56],"by":[57],"using":[58],"automated":[59],"text-mining":[60],"pipelines.":[61],"In":[62],"work,":[64],"we":[65,85],"created":[66],"first":[68],"Italian":[69],"neuropsychiatric":[70],"Named":[71],"Entity":[72],"Recognition":[73],"dataset,":[74],"PsyNIT,":[75],"used":[77],"it":[78],"to":[79,93,136],"develop":[80],"Transformers-based":[82],"model.":[83],"Moreover,":[84],"collected":[86],"leveraged":[88],"three":[89],"external":[90],"independent":[91],"datasets":[92],"implement":[94],"an":[95],"effective":[96],"multicenter":[97],"model,":[98],"with":[99,129],"overall":[100],"F1-score":[101],"84.77%,":[102],"Precision":[103],"83.16%,":[104],"Recall":[105],"86.44%.":[106],"lessons":[108],"learned":[109],"are:":[110],"(i)":[111],"crucial":[113],"role":[114],"consistent":[117],"annotation":[118],"process":[119],"(ii)":[121],"fine-tuning":[123],"strategy":[124],"that":[125,140],"combines":[126],"classical":[127],"methods":[128],"\"low-resource\"":[131],"approach.":[132],"This":[133],"allowed":[134],"us":[135],"establish":[137],"methodological":[138],"guidelines":[139],"pave":[141],"way":[143],"for":[144],"Processing":[147],"studies":[148],"less-resourced":[150],"languages.":[151]},"counts_by_year":[],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2023-06-10T00:00:00"}
