{"id":"https://openalex.org/W4405963525","doi":"https://doi.org/10.1142/s2717554524500140","title":"Leveraging Large Language Models for Speech De-Identification","display_name":"Leveraging Large Language Models for Speech De-Identification","publication_year":2024,"publication_date":"2024-12-31","ids":{"openalex":"https://openalex.org/W4405963525","doi":"https://doi.org/10.1142/s2717554524500140"},"language":"en","primary_location":{"id":"doi:10.1142/s2717554524500140","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s2717554524500140","pdf_url":null,"source":{"id":"https://openalex.org/S4210231678","display_name":"International Journal of Asian Language Processing","issn_l":"2424-791X","issn":["2424-791X","2717-5545"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Asian Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107100236","display_name":"Priyanshu Dhingra","orcid":null},"institutions":[{"id":"https://openalex.org/I98210582","display_name":"Rajiv Gandhi Institute of Petroleum Technology","ror":"https://ror.org/00n7swc17","country_code":"IN","type":"education","lineage":["https://openalex.org/I98210582"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Priyanshu Dhingra","raw_affiliation_strings":["Rajiv Gandhi Institute of Petroleum Technology, Mubarakpur Mukhatiya, Uttar Pradesh 229305, India"],"raw_orcid":"https://orcid.org/0009-0007-7650-0756","affiliations":[{"raw_affiliation_string":"Rajiv Gandhi Institute of Petroleum Technology, Mubarakpur Mukhatiya, Uttar Pradesh 229305, India","institution_ids":["https://openalex.org/I98210582"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Satyam Agrawal","orcid":"https://orcid.org/0009-0002-9032-0739"},"institutions":[{"id":"https://openalex.org/I11880225","display_name":"National Institute of Technology Karnataka","ror":"https://ror.org/01hz4v948","country_code":"IN","type":"education","lineage":["https://openalex.org/I11880225"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Satyam Agrawal","raw_affiliation_strings":["National Institute of Technology Karnataka, Mangaluru, Karnataka 575025, India"],"raw_orcid":"https://orcid.org/0009-0002-9032-0739","affiliations":[{"raw_affiliation_string":"National Institute of Technology Karnataka, Mangaluru, Karnataka 575025, India","institution_ids":["https://openalex.org/I11880225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075624536","display_name":"Chandra Sekar Veerappan","orcid":null},"institutions":[{"id":"https://openalex.org/I168639165","display_name":"Singapore Institute of Technology","ror":"https://ror.org/01v2c2791","country_code":"SG","type":"education","lineage":["https://openalex.org/I168639165"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Chandra Sekar Veerappan","raw_affiliation_strings":["Singapore Institute of Technology, Singapore 828608, Singapore"],"raw_orcid":"https://orcid.org/0000-0003-0948-0568","affiliations":[{"raw_affiliation_string":"Singapore Institute of Technology, Singapore 828608, Singapore","institution_ids":["https://openalex.org/I168639165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070872826","display_name":"Eng Siong Chng","orcid":"https://orcid.org/0000-0001-6257-7399"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Eng Siong Chng","raw_affiliation_strings":["Nanyang Technological University, Singapore 639798, Singapore"],"raw_orcid":"https://orcid.org/0000-0001-6257-7399","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore 639798, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055221016","display_name":"Rong Tong","orcid":"https://orcid.org/0000-0003-3410-8354"},"institutions":[{"id":"https://openalex.org/I168639165","display_name":"Singapore Institute of Technology","ror":"https://ror.org/01v2c2791","country_code":"SG","type":"education","lineage":["https://openalex.org/I168639165"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Rong Tong","raw_affiliation_strings":["Singapore Institute of Technology, Singapore 828608, Singapore"],"raw_orcid":"https://orcid.org/0000-0003-3410-8354","affiliations":[{"raw_affiliation_string":"Singapore Institute of Technology, Singapore 828608, Singapore","institution_ids":["https://openalex.org/I168639165"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3055,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.68133443,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"35","issue":"01","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.8939999938011169,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.8939999938011169,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.8338000178337097,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.6686235666275024},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6568448543548584},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4443347156047821},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3728496730327606},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.3637802004814148},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32969117164611816},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.07349392771720886},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.07081079483032227}],"concepts":[{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.6686235666275024},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6568448543548584},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4443347156047821},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3728496730327606},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3637802004814148},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32969117164611816},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.07349392771720886},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.07081079483032227},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1142/s2717554524500140","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s2717554524500140","pdf_url":null,"source":{"id":"https://openalex.org/S4210231678","display_name":"International Journal of Asian Language Processing","issn_l":"2424-791X","issn":["2424-791X","2717-5545"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Asian Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6100000143051147,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G6346085426","display_name":null,"funder_award_id":"R-IE2-A405-00006","funder_id":"https://openalex.org/F4320320751","funder_display_name":"Ministry of Education - Singapore"},{"id":"https://openalex.org/G6783339877","display_name":null,"funder_award_id":"R-R12-A405-0009","funder_id":"https://openalex.org/F4320320751","funder_display_name":"Ministry of Education - Singapore"}],"funders":[{"id":"https://openalex.org/F4320320751","display_name":"Ministry of Education - Singapore","ror":"https://ror.org/01kcva023"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W2406932913","https://openalex.org/W2407080277","https://openalex.org/W2621075239","https://openalex.org/W2888807255","https://openalex.org/W2914417638","https://openalex.org/W2963956191","https://openalex.org/W2973072704","https://openalex.org/W3011594683","https://openalex.org/W3104182623","https://openalex.org/W3125532488","https://openalex.org/W3127800809","https://openalex.org/W3163839574","https://openalex.org/W4221139374","https://openalex.org/W4297841645","https://openalex.org/W4309773749","https://openalex.org/W4388291822","https://openalex.org/W4390872952","https://openalex.org/W4396759394","https://openalex.org/W4402390097","https://openalex.org/W4406266018"],"related_works":["https://openalex.org/W2898732673","https://openalex.org/W2410053581","https://openalex.org/W2383658677","https://openalex.org/W3123203398","https://openalex.org/W1972473893","https://openalex.org/W2466435674","https://openalex.org/W2765200542","https://openalex.org/W2367893528","https://openalex.org/W3107784576","https://openalex.org/W3204019825"],"abstract_inverted_index":{"This":[0,51],"paper":[1],"presents":[2],"a":[3,16,25,31],"novel":[4],"approach":[5,84],"to":[6,57],"address":[7],"the":[8,59,82,93,104,112,115],"scarcity":[9],"of":[10,106,114],"labeled":[11],"data":[12,34,42,108],"in":[13,118],"speech":[14,40,87],"de-identification,":[15],"critical":[17],"task":[18],"for":[19],"protecting":[20],"personal":[21],"privacy.":[22],"By":[23],"leveraging":[24],"large":[26],"language":[27],"model,":[28],"we":[29,74],"propose":[30],"fully":[32],"automated":[33],"augmentation":[35,109],"strategy":[36,110],"that":[37],"generates":[38],"synthetic":[39],"text":[41],"enriched":[43],"with":[44],"diverse":[45],"personally":[46],"identifiable":[47],"information":[48],"(PII)":[49],"entities.":[50],"augmented":[52],"dataset":[53],"is":[54],"then":[55],"used":[56],"train":[58],"speech-de-identification":[60],"models,":[61],"significantly":[62],"improving":[63,119],"its":[64],"performance":[65],"on":[66],"spoken":[67],"language.":[68],"To":[69],"further":[70],"enhance":[71],"de-identification":[72],"accuracy,":[73],"explore":[75],"both":[76],"pipeline":[77,83],"and":[78,89,111,123],"end-to-end":[79,94,116],"models.":[80],"While":[81],"sequentially":[85],"applies":[86],"recognition":[88],"named":[90],"entity":[91],"recognition,":[92],"model":[95,117],"jointly":[96],"learns":[97],"these":[98],"tasks.":[99],"Our":[100],"experimental":[101],"results":[102],"demonstrate":[103],"effectiveness":[105],"our":[107],"superiority":[113],"PII":[120],"detection":[121],"accuracy":[122],"robustness.":[124]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
