{"id":"https://openalex.org/W7153026408","doi":"https://doi.org/10.48550/arxiv.2604.07354","title":"Contextual Earnings-22: A Speech Recognition Benchmark with Custom Vocabulary in the Wild","display_name":"Contextual Earnings-22: A Speech Recognition Benchmark with Custom Vocabulary in the Wild","publication_year":2026,"publication_date":"2026-03-28","ids":{"openalex":"https://openalex.org/W7153026408","doi":"https://doi.org/10.48550/arxiv.2604.07354"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.07354","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07354","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.07354","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119695000","display_name":"Berkin Durmus","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Durmus, Berkin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133390732","display_name":"Chen Cen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cen, Chen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119694998","display_name":"Eduardo Pacheco","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pacheco, Eduardo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133392806","display_name":"Arda Okan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Okan, Arda","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5119694999","display_name":"Atila Orhon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Orhon, Atila","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5119695000"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.5393999814987183,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.5393999814987183,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.14949999749660492,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.06729999929666519,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.8241000175476074},{"id":"https://openalex.org/keywords/usability","display_name":"Usability","score":0.6674000024795532},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6166999936103821},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.600600004196167},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.47920000553131104}],"concepts":[{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.8241000175476074},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.75},{"id":"https://openalex.org/C170130773","wikidata":"https://www.wikidata.org/wiki/Q216378","display_name":"Usability","level":2,"score":0.6674000024795532},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6166999936103821},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.600600004196167},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5976999998092651},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5184000134468079},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.47920000553131104},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4307999908924103},{"id":"https://openalex.org/C2778571376","wikidata":"https://www.wikidata.org/wiki/Q1355821","display_name":"Frontier","level":2,"score":0.28189998865127563},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.2694000005722046}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.07354","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07354","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.07354","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.07354","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6984214186668396,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"accuracy":[1,120],"frontier":[2],"of":[3,63],"speech-to-text":[4],"systems":[5],"has":[6,57],"plateaued":[7],"on":[8,60,68],"academic":[9],"benchmarks.1":[10],"In":[11],"contrast,":[12],"industrial":[13],"benchmarks":[14,35],"and":[15,52,94,109,117],"adoption":[16],"in":[17],"high-stakes":[18],"domains":[19],"suggest":[20],"otherwise.":[21],"We":[22,76,98],"hypothesize":[23],"that":[24,43,56],"the":[25,29,61],"primary":[26],"difference":[27],"between":[28],"two":[30,104],"is":[31,44,72],"contextual":[32,69],"conditioning:":[33],"Academic":[34],"are":[36],"dominated":[37],"by":[38],"frequently":[39],"encountered":[40],"general":[41],"vocabulary":[42,55,89],"relatively":[45],"easy":[46],"to":[47,91,125],"recognize":[48],"compared":[49],"with":[50,86],"rare":[51],"context-defined":[53],"custom":[54,88],"disproportionate":[58],"impact":[59],"usability":[62],"speech":[64],"transcripts.":[65],"Despite":[66],"progress":[67],"speech-to-text,":[70],"there":[71],"no":[73],"standardized":[74],"benchmark.":[75],"introduce":[77],"Contextual":[78],"Earnings-22,":[79,85],"an":[80],"open":[81],"dataset":[82],"built":[83],"upon":[84],"realistic":[87],"contexts":[90],"foster":[92],"research":[93],"reveal":[95],"latent":[96],"progress.":[97],"set":[99],"six":[100],"strong":[101],"baselines":[102],"for":[103],"dominant":[105],"approaches:":[106],"keyword":[107,110],"prompting":[108],"boosting.":[111],"Experiments":[112],"show":[113],"both":[114],"reach":[115],"comparable":[116],"significantly":[118],"improved":[119],"when":[121],"scaled":[122],"from":[123],"proof-of-concept":[124],"large-scale":[126],"systems.":[127]},"counts_by_year":[],"updated_date":"2026-04-11T06:19:08.300824","created_date":"2026-04-11T00:00:00"}
