{"id":"https://openalex.org/W7152379983","doi":"https://doi.org/10.48550/arxiv.2604.06403","title":"FMI@SU ToxHabits: Evaluating LLMs Performance on Toxic Habit Extraction in Spanish Clinical Texts","display_name":"FMI@SU ToxHabits: Evaluating LLMs Performance on Toxic Habit Extraction in Spanish Clinical Texts","publication_year":2026,"publication_date":"2026-04-07","ids":{"openalex":"https://openalex.org/W7152379983","doi":"https://doi.org/10.48550/arxiv.2604.06403"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.06403","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06403","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.06403","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003348604","display_name":"Sylvia Vassileva","orcid":"https://orcid.org/0000-0002-2257-0659"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vassileva, Sylvia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133314072","display_name":"Ivan Koychev","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koychev, Ivan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5044704545","display_name":"Svetla Boytcheva","orcid":"https://orcid.org/0000-0002-5542-9168"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Boytcheva, Svetla","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4032000005245209,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4032000005245209,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.2004999965429306,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.06369999796152115,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/habit","display_name":"Habit","score":0.5267999768257141},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.33719998598098755},{"id":"https://openalex.org/keywords/risk-assessment","display_name":"Risk assessment","score":0.32580000162124634},{"id":"https://openalex.org/keywords/substance-abuse","display_name":"Substance abuse","score":0.28029999136924744}],"concepts":[{"id":"https://openalex.org/C44670240","wikidata":"https://www.wikidata.org/wiki/Q1299714","display_name":"Habit","level":2,"score":0.5267999768257141},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38960000872612},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3467000126838684},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.33719998598098755},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.33480000495910645},{"id":"https://openalex.org/C12174686","wikidata":"https://www.wikidata.org/wiki/Q1058438","display_name":"Risk assessment","level":2,"score":0.32580000162124634},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3190000057220459},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.31790000200271606},{"id":"https://openalex.org/C99454951","wikidata":"https://www.wikidata.org/wiki/Q932068","display_name":"Environmental health","level":1,"score":0.28519999980926514},{"id":"https://openalex.org/C40010229","wikidata":"https://www.wikidata.org/wiki/Q3184856","display_name":"Substance abuse","level":2,"score":0.28029999136924744}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.06403","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06403","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.06403","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06403","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Good health and well-being","score":0.7556477189064026,"id":"https://metadata.un.org/sdg/3"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0,17],"paper":[1],"presents":[2],"an":[3,87],"approach":[4,18],"for":[5,21,63,100],"the":[6,22,64,79,93],"recognition":[7],"of":[8,60,90],"toxic":[9],"habits":[10],"named":[11,102],"entities":[12,103],"in":[13,29,41,48,81,104],"Spanish":[14],"clinical":[15,42],"texts.":[16],"was":[19],"developed":[20],"ToxHabits":[23],"Shared":[24],"Task.":[25],"Our":[26,84],"team":[27],"participated":[28],"subtask":[30],"1,":[31],"which":[32],"aims":[33],"to":[34],"detect":[35],"substance":[36],"use":[37],"and":[38,45,54,69,72],"abuse":[39],"mentions":[40],"case":[43],"reports":[44],"classify":[46],"them":[47],"four":[49],"categories":[50],"(Tobacco,":[51],"Alcohol,":[52],"Cannabis,":[53],"Drug).":[55],"We":[56],"explored":[57],"various":[58],"methods":[59],"utilizing":[61],"LLMs":[62],"task,":[65],"including":[66],"zero-shot,":[67],"few-shot,":[68],"prompt":[70],"optimization,":[71],"found":[73],"that":[74],"GPT-4.1's":[75],"few-shot":[76],"prompting":[77],"performed":[78],"best":[80],"our":[82],"experiments.":[83],"method":[85],"achieved":[86],"F1":[88],"score":[89],"0.65":[91],"on":[92],"test":[94],"set,":[95],"demonstrating":[96],"a":[97],"promising":[98],"result":[99],"recognizing":[101],"languages":[105],"other":[106],"than":[107],"English.":[108]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-10T00:00:00"}
