{"id":"https://openalex.org/W4226269280","doi":"https://doi.org/10.1162/tacl_a_00491","title":"High Quality Rather than High Model Probability: Minimum Bayes Risk Decoding with Neural Metrics","display_name":"High Quality Rather than High Model Probability: Minimum Bayes Risk Decoding with Neural Metrics","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4226269280","doi":"https://doi.org/10.1162/tacl_a_00491"},"language":"en","primary_location":{"id":"doi:10.1162/tacl_a_00491","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00491","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00491/2037127/tacl_a_00491.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00491/2037127/tacl_a_00491.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065526118","display_name":"Markus Freitag","orcid":"https://orcid.org/0000-0003-2428-0652"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Markus Freitag","raw_affiliation_strings":["Google Research, USA. ::freitag@google.com"],"affiliations":[{"raw_affiliation_string":"Google Research, USA. ::freitag@google.com","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065912572","display_name":"David Grangier","orcid":"https://orcid.org/0000-0002-8847-9532"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"David Grangier","raw_affiliation_strings":["Google Research, USA. grangier@google.com"],"affiliations":[{"raw_affiliation_string":"Google Research, USA. grangier@google.com","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065863466","display_name":"Qijun Tan","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Qijun Tan","raw_affiliation_strings":["Google Research, USA. qijuntan@google.com"],"affiliations":[{"raw_affiliation_string":"Google Research, USA. qijuntan@google.com","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024048679","display_name":"Bowen Liang","orcid":"https://orcid.org/0000-0002-9663-5056"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Bowen Liang","raw_affiliation_strings":["Google Research, USA. bowenl@google.com"],"affiliations":[{"raw_affiliation_string":"Google Research, USA. bowenl@google.com","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5024048679","https://openalex.org/A5065526118","https://openalex.org/A5065863466","https://openalex.org/A5065912572"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":3.184,"has_fulltext":true,"cited_by_count":25,"citation_normalized_percentile":{"value":0.92713137,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"10","issue":null,"first_page":"811","last_page":"825"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9631999731063843,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7801594734191895},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.7691560983657837},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.7635124921798706},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.757736086845398},{"id":"https://openalex.org/keywords/bayes-theorem","display_name":"Bayes' theorem","score":0.6684954762458801},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6563687920570374},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.5854705572128296},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5414755940437317},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5282677412033081},{"id":"https://openalex.org/keywords/beam-search","display_name":"Beam search","score":0.4572789669036865},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.44563910365104675},{"id":"https://openalex.org/keywords/neural-decoding","display_name":"Neural decoding","score":0.44435566663742065},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.4284643530845642},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.356611430644989},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.26980143785476685},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.23288178443908691},{"id":"https://openalex.org/keywords/search-algorithm","display_name":"Search algorithm","score":0.14920446276664734}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7801594734191895},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.7691560983657837},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.7635124921798706},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.757736086845398},{"id":"https://openalex.org/C207201462","wikidata":"https://www.wikidata.org/wiki/Q182505","display_name":"Bayes' theorem","level":3,"score":0.6684954762458801},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6563687920570374},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.5854705572128296},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5414755940437317},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5282677412033081},{"id":"https://openalex.org/C19889080","wikidata":"https://www.wikidata.org/wiki/Q2835852","display_name":"Beam search","level":3,"score":0.4572789669036865},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44563910365104675},{"id":"https://openalex.org/C40743351","wikidata":"https://www.wikidata.org/wiki/Q7002049","display_name":"Neural decoding","level":3,"score":0.44435566663742065},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.4284643530845642},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.356611430644989},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.26980143785476685},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.23288178443908691},{"id":"https://openalex.org/C125583679","wikidata":"https://www.wikidata.org/wiki/Q755673","display_name":"Search algorithm","level":2,"score":0.14920446276664734},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1162/tacl_a_00491","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00491","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00491/2037127/tacl_a_00491.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:b8d9049462604a6ca20703ef34c5a5e0","is_oa":true,"landing_page_url":"https://doaj.org/article/b8d9049462604a6ca20703ef34c5a5e0","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Transactions of the Association for Computational Linguistics, Vol 10 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1162/tacl_a_00491","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00491","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00491/2037127/tacl_a_00491.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4226269280.pdf","grobid_xml":"https://content.openalex.org/works/W4226269280.grobid-xml"},"referenced_works_count":58,"referenced_works":["https://openalex.org/W1528470941","https://openalex.org/W1583837637","https://openalex.org/W1654441844","https://openalex.org/W1967573895","https://openalex.org/W1988520084","https://openalex.org/W1993666847","https://openalex.org/W2100238596","https://openalex.org/W2101105183","https://openalex.org/W2108984739","https://openalex.org/W2137143056","https://openalex.org/W2142112143","https://openalex.org/W2164732909","https://openalex.org/W2250342921","https://openalex.org/W2251367463","https://openalex.org/W2525778437","https://openalex.org/W2559655401","https://openalex.org/W2598654328","https://openalex.org/W2600463316","https://openalex.org/W2612690371","https://openalex.org/W2928941594","https://openalex.org/W2962890089","https://openalex.org/W2963250244","https://openalex.org/W2963532001","https://openalex.org/W2963807318","https://openalex.org/W2964190861","https://openalex.org/W2970279348","https://openalex.org/W2970986500","https://openalex.org/W3035252911","https://openalex.org/W3092058109","https://openalex.org/W3103450644","https://openalex.org/W3105214104","https://openalex.org/W3118026775","https://openalex.org/W3159892921","https://openalex.org/W3176846585","https://openalex.org/W3187364184","https://openalex.org/W3211758383","https://openalex.org/W4205384019","https://openalex.org/W4287115969","https://openalex.org/W4287597717","https://openalex.org/W4287633642","https://openalex.org/W6678262379","https://openalex.org/W6679434410","https://openalex.org/W6679436768","https://openalex.org/W6680129566","https://openalex.org/W6698348375","https://openalex.org/W6722524744","https://openalex.org/W6737778391","https://openalex.org/W6739901393","https://openalex.org/W6755207826","https://openalex.org/W6760633627","https://openalex.org/W6761205521","https://openalex.org/W6777499153","https://openalex.org/W6784336138","https://openalex.org/W6784395031","https://openalex.org/W6788156848","https://openalex.org/W6789259428","https://openalex.org/W6799091307","https://openalex.org/W7074581528"],"related_works":["https://openalex.org/W2098373948","https://openalex.org/W3204412157","https://openalex.org/W1534867933","https://openalex.org/W2587713090","https://openalex.org/W2963141266","https://openalex.org/W2896393657","https://openalex.org/W2744712844","https://openalex.org/W2090610152","https://openalex.org/W2742276804","https://openalex.org/W2903036216"],"abstract_inverted_index":{"Abstract":[0],"In":[1,30],"Neural":[2],"Machine":[3],"Translation,":[4],"it":[5],"is":[6,120],"typically":[7],"assumed":[8],"that":[9,39,97],"the":[10,13,20,23,77,80,87,90,98],"sentence":[11],"with":[12,22,79,89,105,122],"highest":[14,24,81,91],"estimated":[15,92],"probability":[16],"should":[17],"also":[18],"be":[19],"translation":[21,43,64,103],"quality":[25,44,65],"as":[26,66],"measured":[27],"by":[28,140],"humans.":[29],"this":[31,35],"work,":[32],"we":[33],"question":[34],"assumption":[36],"and":[37,42,136],"show":[38,96],"model":[40,82,104,134],"estimates":[41],"only":[45],"vaguely":[46],"correlate.":[47],"We":[48],"apply":[49],"Minimum":[50],"Bayes":[51],"Risk":[52],"(MBR)":[53],"decoding":[54,85],"on":[55],"unbiased":[56],"samples":[57],"to":[58,71],"optimize":[59],"diverse":[60],"automated":[61],"metrics":[62,142],"of":[63,75,100],"an":[67],"alternative":[68],"inference":[69],"strategy":[70],"beam":[72],"search.":[73],"Instead":[74],"targeting":[76],"hypotheses":[78,88],"probability,":[83],"MBR":[84],"extracts":[86],"quality.":[93],"Our":[94],"experiments":[95],"combination":[99],"a":[101,106],"neural":[102,107],"reference-based":[108],"metric,":[109],"Bleurt,":[110],"results":[111],"in":[112,115],"significant":[113],"improvement":[114,119],"human":[116],"evaluations.":[117],"This":[118],"obtained":[121],"translations":[123,130],"different":[124],"from":[125],"classical":[126],"beam-search":[127],"output:":[128],"These":[129],"have":[131],"much":[132],"lower":[133],"likelihood":[135],"are":[137],"less":[138],"favored":[139],"surface":[141],"like":[143],"Bleu.":[144]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":17},{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
