{"id":"https://openalex.org/W7143511642","doi":"https://doi.org/10.48550/arxiv.2603.26246","title":"Distilling Conversations: Abstract Compression of Conversational Audio Context for LLM-based ASR","display_name":"Distilling Conversations: Abstract Compression of Conversational Audio Context for LLM-based ASR","publication_year":2026,"publication_date":"2026-03-27","ids":{"openalex":"https://openalex.org/W7143511642","doi":"https://doi.org/10.48550/arxiv.2603.26246"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.26246","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26246","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.26246","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130992606","display_name":"Shashi Kumar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kumar, Shashi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130938953","display_name":"Esa\u00fa Villatoro-Tello","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Villatoro-Tello, Esa\u00fa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034706108","display_name":"Sergio Burdisso","orcid":"https://orcid.org/0000-0002-7694-6834"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Burdisso, Sergio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130994577","display_name":"Kadri Hacioglu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hacioglu, Kadri","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130985294","display_name":"Thibault Ba\u00f1eras-Roux","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ba\u00f1eras-Roux, Thibault","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092874848","display_name":"Hasindri Watawana","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Watawana, Hasindri","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018275740","display_name":"Dairazalia S\u00e1nchez-Cort\u00e9s","orcid":"https://orcid.org/0000-0003-2429-6152"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sanchez-Cortes, Dairazalia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130943453","display_name":"Srikanth Madikeri","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Madikeri, Srikanth","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076409146","display_name":"Petr Motl\u00ed\u010dek","orcid":"https://orcid.org/0000-0001-6467-1119"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Motlicek, Petr","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130959441","display_name":"Andreas Stolcke","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stolcke, Andreas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9406999945640564,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9406999945640564,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.014299999922513962,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.010900000110268593,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6847000122070312},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.5507000088691711},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5440999865531921},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.5422999858856201},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4927999973297119},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.4912000000476837},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.4788999855518341},{"id":"https://openalex.org/keywords/limiting","display_name":"Limiting","score":0.4481000006198883}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7943999767303467},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7039999961853027},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6847000122070312},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.5507000088691711},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5440999865531921},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.5422999858856201},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4927999973297119},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.4912000000476837},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.4788999855518341},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.4481000006198883},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.42969998717308044},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4244000017642975},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4140999913215637},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.4020000100135803},{"id":"https://openalex.org/C157968479","wikidata":"https://www.wikidata.org/wiki/Q3079876","display_name":"Audio mining","level":4,"score":0.30880001187324524},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.30300000309944153},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2921000123023987},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.28929999470710754},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.2825999855995178},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.27639999985694885},{"id":"https://openalex.org/C165021410","wikidata":"https://www.wikidata.org/wiki/Q55564","display_name":"Lossy compression","level":2,"score":0.27549999952316284},{"id":"https://openalex.org/C35639132","wikidata":"https://www.wikidata.org/wiki/Q7452468","display_name":"Sequence labeling","level":3,"score":0.25999999046325684},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2556000053882599}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.26246","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26246","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.26246","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26246","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Standard":[0],"LLM-based":[1,29],"speech":[2],"recognition":[3,51],"systems":[4],"typically":[5],"process":[6],"utterances":[7],"in":[8],"isolation,":[9],"limiting":[10],"their":[11],"ability":[12],"to":[13,33],"leverage":[14],"conversational":[15,45],"context.":[16],"In":[17],"this":[18],"work,":[19],"we":[20,76],"study":[21],"whether":[22],"multimodal":[23],"context":[24,36,46,59],"from":[25],"prior":[26,86],"turns":[27,87],"improves":[28],"ASR":[30],"and":[31,104,134],"how":[32],"represent":[34],"that":[35],"efficiently.":[37],"We":[38,125],"find":[39],"that,":[40],"after":[41],"supervised":[42],"multi-turn":[43],"training,":[44],"mainly":[47],"helps":[48],"with":[49,70,88,119],"the":[50,63,82,108,114,131],"of":[52,85,92,113,116,130],"contextual":[53],"entities.":[54],"However,":[55],"conditioning":[56,118],"on":[57],"raw":[58],"is":[60],"expensive":[61],"because":[62],"prior-turn":[64,122],"audio":[65,83,123],"token":[66],"sequence":[67],"grows":[68],"rapidly":[69],"conversation":[71],"length.":[72],"To":[73],"address":[74],"this,":[75],"propose":[77],"Abstract":[78],"Compression,":[79],"which":[80],"replaces":[81],"portion":[84],"a":[89,120],"fixed":[90],"number":[91],"learned":[93],"latent":[94],"tokens":[95],"while":[96],"retaining":[97],"corresponding":[98],"transcripts":[99],"explicitly.":[100],"On":[101],"both":[102],"in-domain":[103],"out-of-domain":[105],"test":[106],"sets,":[107],"compressed":[109],"model":[110],"recovers":[111],"part":[112],"gains":[115],"raw-context":[117],"smaller":[121],"footprint.":[124],"also":[126],"provide":[127],"targeted":[128],"analyses":[129],"compression":[132],"setup":[133],"its":[135],"trade-offs.":[136]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-31T00:00:00"}
