{"id":"https://openalex.org/W7148578828","doi":"https://doi.org/10.1109/asru65441.2025.11434612","title":"LLM-Based Dictation Detection from Doctor-Patient Conversations","display_name":"LLM-Based Dictation Detection from Doctor-Patient Conversations","publication_year":2025,"publication_date":"2025-12-06","ids":{"openalex":"https://openalex.org/W7148578828","doi":"https://doi.org/10.1109/asru65441.2025.11434612"},"language":null,"primary_location":{"id":"doi:10.1109/asru65441.2025.11434612","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru65441.2025.11434612","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132766934","display_name":"Siyuan Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210123366","display_name":"Health Information Management","ror":"https://ror.org/02zmq8s40","country_code":"BE","type":"other","lineage":["https://openalex.org/I4210123366"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Siyuan Chen","raw_affiliation_strings":["Solventum Health Information Systems"],"affiliations":[{"raw_affiliation_string":"Solventum Health Information Systems","institution_ids":["https://openalex.org/I4210123366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004024479","display_name":"Mojtaba Kadkhodaie Elyaderani","orcid":null},"institutions":[{"id":"https://openalex.org/I4210123366","display_name":"Health Information Management","ror":"https://ror.org/02zmq8s40","country_code":"BE","type":"other","lineage":["https://openalex.org/I4210123366"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Mojtaba Kadkhodaie Elyaderani","raw_affiliation_strings":["Solventum Health Information Systems"],"affiliations":[{"raw_affiliation_string":"Solventum Health Information Systems","institution_ids":["https://openalex.org/I4210123366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132779530","display_name":"Jing Su","orcid":null},"institutions":[{"id":"https://openalex.org/I4210123366","display_name":"Health Information Management","ror":"https://ror.org/02zmq8s40","country_code":"BE","type":"other","lineage":["https://openalex.org/I4210123366"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Jing Su","raw_affiliation_strings":["Solventum Health Information Systems"],"affiliations":[{"raw_affiliation_string":"Solventum Health Information Systems","institution_ids":["https://openalex.org/I4210123366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050036240","display_name":"Susanne B\u00fcrger","orcid":null},"institutions":[{"id":"https://openalex.org/I4210123366","display_name":"Health Information Management","ror":"https://ror.org/02zmq8s40","country_code":"BE","type":"other","lineage":["https://openalex.org/I4210123366"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Susanne Burger","raw_affiliation_strings":["Solventum Health Information Systems"],"affiliations":[{"raw_affiliation_string":"Solventum Health Information Systems","institution_ids":["https://openalex.org/I4210123366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010424125","display_name":"Thomas Schaaf","orcid":"https://orcid.org/0000-0002-9569-4759"},"institutions":[{"id":"https://openalex.org/I4210123366","display_name":"Health Information Management","ror":"https://ror.org/02zmq8s40","country_code":"BE","type":"other","lineage":["https://openalex.org/I4210123366"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Thomas Schaaf","raw_affiliation_strings":["Solventum Health Information Systems"],"affiliations":[{"raw_affiliation_string":"Solventum Health Information Systems","institution_ids":["https://openalex.org/I4210123366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5132766934"],"corresponding_institution_ids":["https://openalex.org/I4210123366"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.87579489,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3707999885082245,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3707999885082245,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.2021999955177307,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.0835999995470047,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dictation","display_name":"Dictation","score":0.37439998984336853},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.2766000032424927},{"id":"https://openalex.org/keywords/conjunction","display_name":"Conjunction (astronomy)","score":0.21739999949932098},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.211899995803833}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.600600004196167},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4722999930381775},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4203999936580658},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38999998569488525},{"id":"https://openalex.org/C2779077324","wikidata":"https://www.wikidata.org/wiki/Q1087138","display_name":"Dictation","level":2,"score":0.37439998984336853},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2766000032424927},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.22300000488758087},{"id":"https://openalex.org/C59656382","wikidata":"https://www.wikidata.org/wiki/Q191536","display_name":"Conjunction (astronomy)","level":2,"score":0.21739999949932098},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.2167000025510788},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.211899995803833}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/asru65441.2025.11434612","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru65441.2025.11434612","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2754624876","https://openalex.org/W2786232884","https://openalex.org/W3045635560","https://openalex.org/W3083029406","https://openalex.org/W3177464472","https://openalex.org/W3201710275","https://openalex.org/W4210521413","https://openalex.org/W4297841431","https://openalex.org/W4385571397","https://openalex.org/W4386492483","https://openalex.org/W4387321091","https://openalex.org/W4391745701","https://openalex.org/W4399083018","https://openalex.org/W4411379405","https://openalex.org/W4415433498"],"related_works":[],"abstract_inverted_index":{"Clinical":[0],"ambient":[1],"documentation":[2],"systems":[3],"need":[4],"to":[5,11,21,50],"detect":[6,22],"dictation":[7,23,42,133],"from":[8],"doctor-patient":[9],"conversations":[10],"ensure":[12],"critical":[13],"statements":[14],"are":[15],"properly":[16],"recorded.":[17],"Existing":[18],"methods":[19],"struggle":[20],"interleaved":[24],"within":[25],"conversational":[26],"exchanges.":[27],"We":[28,115],"investigated":[29],"LLM-based":[30],"approaches:":[31],"zero-shot,":[32],"multi-shot,":[33],"manual/auto":[34],"prompt":[35],"tuning,":[36],"and":[37,54,60,78,102],"supervised":[38],"fine-tuning":[39],"for":[40,128],"medical":[41,132],"detection.":[43,134],"A":[44],"word":[45],"alignment-based":[46],"method":[47],"is":[48],"proposed":[49],"mitigate":[51],"ASR":[52],"errors":[53],"LLM":[55,68],"hallucinations":[56],"while":[57],"performing":[58],"utterance-":[59],"word-level":[61,83],"evaluation.":[62],"Supervised":[63],"finetuning":[64],"of":[65,131],"a":[66],"Qwen2-1.5B":[67],"achieves":[69],"the":[70,108,120,124,129],"best":[71],"performance:":[72],"$\\mathbf{9":[73],"0.":[74],"4":[75],"\\%}$":[76,82],"utterance-level":[77],"$\\mathbf{8":[79],"6.":[80],"8":[81],"macro":[84],"F1":[85],"on":[86,92,119],"manual":[87],"transcripts,":[88],"with":[89,99],"minimal":[90],"loss":[91],"ASR.":[93],"This":[94],"surpasses":[95],"Claude":[96],"3.5":[97],"Sonnet":[98],"auto-tuned":[100],"prompts":[101],"multiple":[103],"in-context":[104],"learning":[105],"examples,":[106],"though":[107],"latter":[109],"requires":[110],"much":[111],"less":[112],"training":[113],"data.":[114],"release":[116],"model":[117],"outputs":[118],"ACI-Bench":[121],"dataset,":[122],"providing":[123],"first":[125],"open":[126],"resource":[127],"evaluation":[130]},"counts_by_year":[],"updated_date":"2026-04-03T16:44:17.987007","created_date":"2026-04-03T00:00:00"}
