{"id":"https://openalex.org/W4403941828","doi":"https://doi.org/10.1145/3688868.3689200","title":"BURExtract-Llama: An LLM for Clinical Concept Extraction in Breast Ultrasound Reports","display_name":"BURExtract-Llama: An LLM for Clinical Concept Extraction in Breast Ultrasound Reports","publication_year":2024,"publication_date":"2024-10-28","ids":{"openalex":"https://openalex.org/W4403941828","doi":"https://doi.org/10.1145/3688868.3689200"},"language":"en","primary_location":{"id":"doi:10.1145/3688868.3689200","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3688868.3689200","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3688868.3689200","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st International Workshop on Multimedia Computing for Health and Medicine","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3688868.3689200","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056441202","display_name":"Yuxuan Chen","orcid":"https://orcid.org/0000-0002-8589-2583"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yuxuan Chen","raw_affiliation_strings":["New York University, New York, NY, USA"],"raw_orcid":"https://orcid.org/0000-0002-8589-2583","affiliations":[{"raw_affiliation_string":"New York University, New York, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082687421","display_name":"Haoyan Yang","orcid":"https://orcid.org/0009-0003-5145-7289"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Haoyan Yang","raw_affiliation_strings":["New York University, New York, NY, USA"],"raw_orcid":"https://orcid.org/0009-0003-5145-7289","affiliations":[{"raw_affiliation_string":"New York University, New York, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109711448","display_name":"Hengkai Pan","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hengkai Pan","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA, USA"],"raw_orcid":"https://orcid.org/0009-0000-6446-2392","affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058325675","display_name":"Fardeen Siddiqui","orcid":"https://orcid.org/0000-0003-3433-4300"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fardeen Siddiqui","raw_affiliation_strings":["NYU Langone Health, New York, USA"],"raw_orcid":"https://orcid.org/0000-0003-3433-4300","affiliations":[{"raw_affiliation_string":"NYU Langone Health, New York, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079380037","display_name":"Antonio Verdone","orcid":null},"institutions":[{"id":"https://openalex.org/I4210086933","display_name":"NYU Langone Health","ror":"https://ror.org/005dvqh91","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210086933"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Antonio Verdone","raw_affiliation_strings":["NYU Langone Health, New York, NY, USA"],"raw_orcid":"https://orcid.org/0009-0000-4420-9701","affiliations":[{"raw_affiliation_string":"NYU Langone Health, New York, NY, USA","institution_ids":["https://openalex.org/I4210086933"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Qingyang Zhang","orcid":"https://orcid.org/0009-0003-4726-7378"},"institutions":[{"id":"https://openalex.org/I258800397","display_name":"New York University Shanghai","ror":"https://ror.org/02vpsdb40","country_code":"CN","type":"education","lineage":["https://openalex.org/I258800397","https://openalex.org/I57206974"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingyang Zhang","raw_affiliation_strings":["NYU Shanghai, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0003-4726-7378","affiliations":[{"raw_affiliation_string":"NYU Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I258800397"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078511139","display_name":"Sumit Chopra","orcid":"https://orcid.org/0009-0009-6637-2230"},"institutions":[{"id":"https://openalex.org/I4210086933","display_name":"NYU Langone Health","ror":"https://ror.org/005dvqh91","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210086933"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sumit Chopra","raw_affiliation_strings":["NYU Langone Health, New York, NY, USA"],"raw_orcid":"https://orcid.org/0009-0009-6637-2230","affiliations":[{"raw_affiliation_string":"NYU Langone Health, New York, NY, USA","institution_ids":["https://openalex.org/I4210086933"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101462636","display_name":"Chen Zhao","orcid":"https://orcid.org/0000-0001-7672-146X"},"institutions":[{"id":"https://openalex.org/I258800397","display_name":"New York University Shanghai","ror":"https://ror.org/02vpsdb40","country_code":"CN","type":"education","lineage":["https://openalex.org/I258800397","https://openalex.org/I57206974"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chen Zhao","raw_affiliation_strings":["NYU Shanghai, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-7672-146X","affiliations":[{"raw_affiliation_string":"NYU Shanghai, Shanghai, China","institution_ids":["https://openalex.org/I258800397"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003735451","display_name":"Yiqiu Shen","orcid":"https://orcid.org/0000-0002-7726-2514"},"institutions":[{"id":"https://openalex.org/I4210086933","display_name":"NYU Langone Health","ror":"https://ror.org/005dvqh91","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210086933"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yiqiu Shen","raw_affiliation_strings":["NYU Langone Health, New York, NY, USA"],"raw_orcid":"https://orcid.org/0000-0002-7726-2514","affiliations":[{"raw_affiliation_string":"NYU Langone Health, New York, NY, USA","institution_ids":["https://openalex.org/I4210086933"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5056441202"],"corresponding_institution_ids":["https://openalex.org/I57206974"],"apc_list":null,"apc_paid":null,"fwci":1.336,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.80826055,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"53","last_page":"58"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.98089998960495,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ultrasound","display_name":"Ultrasound","score":0.6172350645065308},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5683786273002625},{"id":"https://openalex.org/keywords/extraction","display_name":"Extraction (chemistry)","score":0.5532302260398865},{"id":"https://openalex.org/keywords/breast-ultrasound","display_name":"Breast ultrasound","score":0.4837739169597626},{"id":"https://openalex.org/keywords/medical-physics","display_name":"Medical physics","score":0.3219592571258545},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.3084298372268677},{"id":"https://openalex.org/keywords/radiology","display_name":"Radiology","score":0.2873057723045349},{"id":"https://openalex.org/keywords/mammography","display_name":"Mammography","score":0.2636556625366211},{"id":"https://openalex.org/keywords/breast-cancer","display_name":"Breast cancer","score":0.12187159061431885},{"id":"https://openalex.org/keywords/internal-medicine","display_name":"Internal medicine","score":0.11714616417884827},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.09691041707992554},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.07384231686592102}],"concepts":[{"id":"https://openalex.org/C143753070","wikidata":"https://www.wikidata.org/wiki/Q162564","display_name":"Ultrasound","level":2,"score":0.6172350645065308},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5683786273002625},{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.5532302260398865},{"id":"https://openalex.org/C2777423100","wikidata":"https://www.wikidata.org/wiki/Q1888238","display_name":"Breast ultrasound","level":5,"score":0.4837739169597626},{"id":"https://openalex.org/C19527891","wikidata":"https://www.wikidata.org/wiki/Q1120908","display_name":"Medical physics","level":1,"score":0.3219592571258545},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.3084298372268677},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.2873057723045349},{"id":"https://openalex.org/C2780472235","wikidata":"https://www.wikidata.org/wiki/Q324634","display_name":"Mammography","level":4,"score":0.2636556625366211},{"id":"https://openalex.org/C530470458","wikidata":"https://www.wikidata.org/wiki/Q128581","display_name":"Breast cancer","level":3,"score":0.12187159061431885},{"id":"https://openalex.org/C126322002","wikidata":"https://www.wikidata.org/wiki/Q11180","display_name":"Internal medicine","level":1,"score":0.11714616417884827},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.09691041707992554},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.07384231686592102},{"id":"https://openalex.org/C121608353","wikidata":"https://www.wikidata.org/wiki/Q12078","display_name":"Cancer","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3688868.3689200","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3688868.3689200","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3688868.3689200","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st International Workshop on Multimedia Computing for Health and Medicine","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3688868.3689200","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3688868.3689200","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3688868.3689200","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st International Workshop on Multimedia Computing for Health and Medicine","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4403941828.pdf","grobid_xml":"https://content.openalex.org/works/W4403941828.grobid-xml"},"referenced_works_count":8,"referenced_works":["https://openalex.org/W1504212872","https://openalex.org/W2003798170","https://openalex.org/W2115570566","https://openalex.org/W3095092693","https://openalex.org/W4212774754","https://openalex.org/W4291617889","https://openalex.org/W4379379356","https://openalex.org/W4380591192"],"related_works":["https://openalex.org/W3108039862","https://openalex.org/W2618954822","https://openalex.org/W1990605602","https://openalex.org/W31474833","https://openalex.org/W2348815573","https://openalex.org/W4283075545","https://openalex.org/W2896805445","https://openalex.org/W2101706338","https://openalex.org/W2133314627","https://openalex.org/W2013481827"],"abstract_inverted_index":{"Breast":[0],"ultrasound":[1],"plays":[2],"a":[3,73,93,101,108],"pivotal":[4],"role":[5],"in":[6],"detecting":[7],"and":[8,23,47,61,156],"diagnosing":[9],"breast":[10],"abnormalities.":[11],"Radiology":[12],"reports":[13,111],"summarize":[14],"key":[15],"findings":[16,132],"from":[17,84],"these":[18,85],"examinations,":[19],"highlighting":[20],"lesion":[21],"characteristics":[22],"malignancy":[24],"assessments.":[25],"However,":[26],"extracting":[27],"this":[28,104],"critical":[29],"information":[30,83],"is":[31,126,136],"challenging":[32],"due":[33],"to":[34,80,91,138],"the":[35,115,147],"unstructured":[36],"nature":[37],"of":[38,96,110,123,149],"radiology":[39],"reports,":[40],"which":[41,125],"often":[42],"exhibit":[43],"varied":[44],"linguistic":[45],"styles":[46],"inconsistent":[48],"formatting.":[49],"While":[50],"proprietary":[51],"LLMs":[52],"like":[53],"GPT-4":[54,90,150],"effectively":[55],"retrieve":[56],"information,":[57],"they":[58],"are":[59],"costly":[60],"raise":[62],"privacy":[63],"concerns":[64],"when":[65],"handling":[66],"protected":[67],"health":[68],"information.":[69],"This":[70],"study":[71],"presents":[72],"pipeline":[74],"for":[75],"developing":[76],"an":[77,119,140],"in-house":[78,141],"LLM":[79,142],"extract":[81],"clinical":[82],"reports.":[86],"We":[87],"first":[88],"utilize":[89],"create":[92],"small":[94],"subset":[95,109],"labeled":[97],"data,":[98],"then":[99],"fine-tune":[100],"Llama3-8B":[102],"using":[103],"dataset.":[105],"Evaluated":[106],"on":[107,127],"annotated":[112],"by":[113],"clinicians,":[114],"proposed":[116],"model":[117],"achieves":[118],"average":[120],"F1":[121],"score":[122],"84.6%,":[124],"par":[128],"with":[129],"GPT-4.":[130],"Our":[131],"demonstrate":[133],"that":[134,143],"it":[135],"feasible":[137],"develop":[139],"not":[144],"only":[145],"matches":[146],"performance":[148],"but":[151],"also":[152],"offers":[153],"cost":[154],"reductions":[155],"enhanced":[157],"data":[158],"privacy.":[159]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
