{"id":"https://openalex.org/W2913218482","doi":"https://doi.org/10.1145/3308558.3313415","title":"Improving Neural Response Diversity with Frequency-Aware Cross-Entropy Loss","display_name":"Improving Neural Response Diversity with Frequency-Aware Cross-Entropy Loss","publication_year":2019,"publication_date":"2019-05-13","ids":{"openalex":"https://openalex.org/W2913218482","doi":"https://doi.org/10.1145/3308558.3313415","mag":"2913218482"},"language":"en","primary_location":{"id":"doi:10.1145/3308558.3313415","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3308558.3313415","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The World Wide Web Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3308558.3313415","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Shaojie Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Shaojie Jiang","raw_affiliation_strings":["University of Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam, Netherlands","institution_ids":["https://openalex.org/I887064364"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Pengjie Ren","orcid":null},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Pengjie Ren","raw_affiliation_strings":["University of Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam, Netherlands","institution_ids":["https://openalex.org/I887064364"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Christof Monz","orcid":null},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Christof Monz","raw_affiliation_strings":["University of Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam, Netherlands","institution_ids":["https://openalex.org/I887064364"]}]},{"author_position":"last","author":{"id":null,"display_name":"Maarten de Rijke","orcid":null},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Maarten de Rijke","raw_affiliation_strings":["University of Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam, Netherlands","institution_ids":["https://openalex.org/I887064364"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I887064364"],"apc_list":null,"apc_paid":null,"fwci":1.8786,"has_fulltext":true,"cited_by_count":32,"citation_normalized_percentile":{"value":0.8919039,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2879","last_page":"2885"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.6575999855995178},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.5440000295639038},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.5392000079154968},{"id":"https://openalex.org/keywords/loss-function","display_name":"Loss function","score":0.531499981880188},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.49160000681877136},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.4311999976634979}],"concepts":[{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.6575999855995178},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6399999856948853},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.5440000295639038},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.5392000079154968},{"id":"https://openalex.org/C105951970","wikidata":"https://www.wikidata.org/wiki/Q1036748","display_name":"Loss function","level":4,"score":0.531499981880188},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.49160000681877136},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4447999894618988},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.4311999976634979},{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.3862000107765198},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35109999775886536},{"id":"https://openalex.org/C13355873","wikidata":"https://www.wikidata.org/wiki/Q2920850","display_name":"Connection (principal bundle)","level":2,"score":0.32670000195503235},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.32179999351501465},{"id":"https://openalex.org/C70136482","wikidata":"https://www.wikidata.org/wiki/Q13583781","display_name":"A-weighting","level":3,"score":0.3206000030040741},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3028999865055084},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2705000042915344}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1145/3308558.3313415","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3308558.3313415","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The World Wide Web Conference","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1902.09191","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1902.09191","pdf_url":"https://arxiv.org/pdf/1902.09191","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:dare.uva.nl:openaire/56256d88-fab1-43cc-8a74-74b11de49c1d","is_oa":true,"landing_page_url":"https://handle.uba.uva.nl/personal/pure/en/publications/improving-neural-response-diversity-with-frequencyaware-crossentropy-loss(56256d88-fab1-43cc-8a74-74b11de49c1d).html","pdf_url":"https://pure.uva.nl/ws/files/42480648/p2879_jiang.pdf","source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Jiang, S, Ren, P, Monz, C & de Rijke, M 2019, Improving Neural Response Diversity with Frequency-Aware Cross-Entropy Loss. in The Web Conference 2019 : proceedings of the World Wide Web Conference WWW 2019 : May 13-17, 2019, San Francisco, CA, USA. Association for Computing Machinery, New York, pp. 2879-2885, 2019 World Wide Web Conference, WWW 2019, San Francisco, United States, 13/05/19. https://doi.org/10.1145/3308558.3313415","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:uvapub:oai:dare.uva.nl:publications/56256d88-fab1-43cc-8a74-74b11de49c1d","is_oa":true,"landing_page_url":"https://dare.uva.nl/personal/pure/en/publications/improving-neural-response-diversity-with-frequencyaware-crossentropy-loss(56256d88-fab1-43cc-8a74-74b11de49c1d).html","pdf_url":"https://dare.uva.nl/personal/pure/en/publications/improving-neural-response-diversity-with-frequencyaware-crossentropy-loss(56256d88-fab1-43cc-8a74-74b11de49c1d).html","source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"The Web Conference 2019: proceedings of the World Wide Web Conference WWW 2019 : May 13-17, 2019, San Francisco, CA, USA, 2879 - 2885","raw_type":"info:eu-repo/semantics/conferencepaper"},{"id":"pmh:oai:dare.uva.nl:publications/56256d88-fab1-43cc-8a74-74b11de49c1d","is_oa":true,"landing_page_url":"https://hdl.handle.net/11245.1/56256d88-fab1-43cc-8a74-74b11de49c1d","pdf_url":null,"source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Jiang, S, Ren, P, Monz, C & de Rijke, M 2019, Improving Neural Response Diversity with Frequency-Aware Cross-Entropy Loss. in The Web Conference 2019 : proceedings of the World Wide Web Conference WWW 2019 : May 13-17, 2019, San Francisco, CA, USA. Association for Computing Machinery, New York, pp. 2879-2885, 2019 World Wide Web Conference, WWW 2019, San Francisco, United States, 13/05/19. https://doi.org/10.1145/3308558.3313415","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":{"id":"doi:10.1145/3308558.3313415","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3308558.3313415","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The World Wide Web Conference","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8589651859","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320322725","funder_display_name":"China Scholarship Council"}],"funders":[{"id":"https://openalex.org/F4320321182","display_name":"VSNU Vereniging van Universiteiten","ror":"https://ror.org/05wvdt748"},{"id":"https://openalex.org/F4320322725","display_name":"China Scholarship Council","ror":"https://ror.org/04atp4p48"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W35652532","https://openalex.org/W635530177","https://openalex.org/W1518951372","https://openalex.org/W2101105183","https://openalex.org/W2962717182","https://openalex.org/W2962814079","https://openalex.org/W2962974452","https://openalex.org/W2963206148","https://openalex.org/W2963712524","https://openalex.org/W2963903950"],"related_works":[],"abstract_inverted_index":{"Sequence-to-Sequence":[0],"(Seq2Seq)":[1],"models":[2],"have":[3],"achieved":[4],"encouraging":[5],"performance":[6],"on":[7,105,110],"the":[8,31,40,58,61,71,95,115,124],"dialogue":[9],"response":[10,16,130],"generation":[11,17,131],"task.":[12],"However,":[13],"existing":[14,127],"Seq2Seq-based":[15],"methods":[18],"suffer":[19],"from":[20],"a":[21,86,101],"low-diversity":[22,41,81],"problem:":[23],"they":[24],"frequently":[25],"generate":[26],"generic":[27],"responses,":[28],"which":[29,78],"make":[30],"conversation":[32],"less":[33],"interesting.":[34],"In":[35],"this":[36],"paper,":[37],"we":[38,55],"address":[39],"problem":[42],"by":[43,99],"investigating":[44],"its":[45],"connection":[46],"with":[47],"model":[48],"over-confidence":[49],"reflected":[50],"in":[51,80,133],"predicted":[52],"distributions.":[53],"Specifically,":[54],"first":[56],"analyze":[57],"influence":[59],"of":[60,126,135],"commonly":[62],"used":[63],"Cross-Entropy":[64,88],"(CE)":[65],"loss":[66,73,90,97,117],"function,":[67],"and":[68,138],"find":[69],"that":[70,92,114],"CE":[72,96],"function":[74,91,98,118],"prefers":[75],"high-frequency":[76],"tokens,":[77],"results":[79],"responses.":[82],"We":[83],"then":[84],"propose":[85],"Frequency-Aware":[87],"(FACE)":[89],"improves":[93],"over":[94],"incorporating":[100],"weighting":[102],"mechanism":[103],"conditioned":[104],"token":[106],"frequency.":[107],"Extensive":[108],"experiments":[109],"benchmark":[111],"datasets":[112],"show":[113],"FACE":[116],"is":[119],"able":[120],"to":[121],"substantially":[122],"improve":[123],"diversity":[125],"state-of-the-art":[128],"Seq2Seq":[129],"methods,":[132],"terms":[134],"both":[136],"automatic":[137],"human":[139],"evaluations.":[140]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2019-02-21T00:00:00"}
