{"id":"https://openalex.org/W2963569619","doi":"https://doi.org/10.18653/v1/p19-1098","title":"Improving the Similarity Measure of Determinantal Point Processes for Extractive Multi-Document Summarization","display_name":"Improving the Similarity Measure of Determinantal Point Processes for Extractive Multi-Document Summarization","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2963569619","doi":"https://doi.org/10.18653/v1/p19-1098","mag":"2963569619"},"language":"en","primary_location":{"id":"doi:10.18653/v1/p19-1098","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1098","pdf_url":"https://www.aclweb.org/anthology/P19-1098.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/P19-1098.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036306083","display_name":"Sangwoo Cho","orcid":null},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sangwoo Cho","raw_affiliation_strings":["Computer Science Department University of Central Florida, Orlando, FL 32816, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department University of Central Florida, Orlando, FL 32816, USA","institution_ids":["https://openalex.org/I106165777"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056430376","display_name":"Logan Lebanoff","orcid":"https://orcid.org/0000-0001-7079-0210"},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Logan Lebanoff","raw_affiliation_strings":["Computer Science Department University of Central Florida, Orlando, FL 32816, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department University of Central Florida, Orlando, FL 32816, USA","institution_ids":["https://openalex.org/I106165777"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076117344","display_name":"Hassan Foroosh","orcid":"https://orcid.org/0000-0002-7601-8165"},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hassan Foroosh","raw_affiliation_strings":["Computer Science Department University of Central Florida, Orlando, FL 32816, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department University of Central Florida, Orlando, FL 32816, USA","institution_ids":["https://openalex.org/I106165777"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100394562","display_name":"Fei Liu","orcid":"https://orcid.org/0000-0001-7141-5105"},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fei Liu","raw_affiliation_strings":["Computer Science Department University of Central Florida, Orlando, FL 32816, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science Department University of Central Florida, Orlando, FL 32816, USA","institution_ids":["https://openalex.org/I106165777"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5036306083"],"corresponding_institution_ids":["https://openalex.org/I106165777"],"apc_list":null,"apc_paid":null,"fwci":7.6591,"has_fulltext":true,"cited_by_count":62,"citation_normalized_percentile":{"value":0.97783142,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1027","last_page":"1038"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.9620770215988159},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.7868736982345581},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7737400531768799},{"id":"https://openalex.org/keywords/similarity-measure","display_name":"Similarity measure","score":0.5994244813919067},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.5906692147254944},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5537049174308777},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5501459836959839},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5030393004417419},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.4878937900066376},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.4805765151977539},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4281834363937378},{"id":"https://openalex.org/keywords/determinantal-point-process","display_name":"Determinantal point process","score":0.42731690406799316},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4021323323249817},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.34581756591796875}],"concepts":[{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.9620770215988159},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.7868736982345581},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7737400531768799},{"id":"https://openalex.org/C2776517306","wikidata":"https://www.wikidata.org/wiki/Q29017317","display_name":"Similarity measure","level":2,"score":0.5994244813919067},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.5906692147254944},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5537049174308777},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5501459836959839},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5030393004417419},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.4878937900066376},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.4805765151977539},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4281834363937378},{"id":"https://openalex.org/C72010251","wikidata":"https://www.wikidata.org/wiki/Q5265688","display_name":"Determinantal point process","level":4,"score":0.42731690406799316},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4021323323249817},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.34581756591796875},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C64812099","wikidata":"https://www.wikidata.org/wiki/Q176604","display_name":"Random matrix","level":3,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/p19-1098","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1098","pdf_url":"https://www.aclweb.org/anthology/P19-1098.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/p19-1098","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1098","pdf_url":"https://www.aclweb.org/anthology/P19-1098.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5299999713897705}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2963569619.pdf","grobid_xml":"https://content.openalex.org/works/W2963569619.grobid-xml"},"referenced_works_count":76,"referenced_works":["https://openalex.org/W41776650","https://openalex.org/W607342991","https://openalex.org/W1488425980","https://openalex.org/W1544827683","https://openalex.org/W1840435438","https://openalex.org/W1939882552","https://openalex.org/W1962684803","https://openalex.org/W1975579663","https://openalex.org/W1976806664","https://openalex.org/W1989420837","https://openalex.org/W1999447745","https://openalex.org/W2001135856","https://openalex.org/W2036371118","https://openalex.org/W2083305840","https://openalex.org/W2103339462","https://openalex.org/W2115857089","https://openalex.org/W2115937944","https://openalex.org/W2122311631","https://openalex.org/W2133182690","https://openalex.org/W2138556193","https://openalex.org/W2148404145","https://openalex.org/W2150869743","https://openalex.org/W2151258001","https://openalex.org/W2154652894","https://openalex.org/W2182572585","https://openalex.org/W2250483006","https://openalex.org/W2250829779","https://openalex.org/W2250873048","https://openalex.org/W2251384446","https://openalex.org/W2251654079","https://openalex.org/W2251750971","https://openalex.org/W2251803607","https://openalex.org/W2293771131","https://openalex.org/W2307381258","https://openalex.org/W2341349540","https://openalex.org/W2404691574","https://openalex.org/W2574535369","https://openalex.org/W2606974598","https://openalex.org/W2609482285","https://openalex.org/W2612675303","https://openalex.org/W2741375528","https://openalex.org/W2768957049","https://openalex.org/W2785994986","https://openalex.org/W2798416089","https://openalex.org/W2808293684","https://openalex.org/W2836428027","https://openalex.org/W2889518897","https://openalex.org/W2949615363","https://openalex.org/W2952138241","https://openalex.org/W2952215948","https://openalex.org/W2962853356","https://openalex.org/W2962946054","https://openalex.org/W2962972512","https://openalex.org/W2962985882","https://openalex.org/W2963125472","https://openalex.org/W2963227052","https://openalex.org/W2963385935","https://openalex.org/W2963458607","https://openalex.org/W2963548995","https://openalex.org/W2963607157","https://openalex.org/W2963676814","https://openalex.org/W2963703618","https://openalex.org/W2963846996","https://openalex.org/W2963882968","https://openalex.org/W2963919999","https://openalex.org/W2963929190","https://openalex.org/W2964144561","https://openalex.org/W2964213257","https://openalex.org/W2964285114","https://openalex.org/W3101913037","https://openalex.org/W3103014337","https://openalex.org/W3104033643","https://openalex.org/W3138773240","https://openalex.org/W4292356436","https://openalex.org/W4298077084","https://openalex.org/W4313908941"],"related_works":["https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W2091301346","https://openalex.org/W3148229873","https://openalex.org/W4389760904","https://openalex.org/W2150160875","https://openalex.org/W4242223894","https://openalex.org/W4306886878","https://openalex.org/W2973759123","https://openalex.org/W1517524280"],"abstract_inverted_index":{"The":[0,68],"most":[1],"important":[2],"obstacles":[3,21],"facing":[4],"multidocument":[5],"summarization":[6,57,98],"include":[7],"excessive":[8],"redundancy":[9,71],"in":[10],"source":[11],"descriptions":[12],"and":[13,81],"the":[14],"looming":[15],"shortage":[16],"of":[17,75],"training":[18],"data.":[19],"These":[20],"prevent":[22],"encoder-decoder":[23],"models":[24],"from":[25],"being":[26],"used":[27],"directly,":[28],"but":[29],"optimization-based":[30],"methods":[31],"such":[32],"as":[33],"determinantal":[34],"point":[35],"processes":[36],"(DPPs)":[37],"are":[38,105],"known":[39],"to":[40,49],"handle":[41],"them":[42],"well.":[43],"In":[44],"this":[45],"paper":[46],"we":[47],"seek":[48],"strengthen":[50],"a":[51,60,73],"DPP-based":[52],"method":[53],"for":[54,108],"extractive":[55],"multi-document":[56],"by":[58,65,112],"presenting":[59],"novel":[61],"similarity":[62,92],"measure":[63,93],"inspired":[64],"capsule":[66],"networks.":[67],"approach":[69],"measures":[70],"between":[72],"pair":[74],"sentences":[76],"based":[77],"on":[78,100],"surface":[79],"form":[80],"semantic":[82],"information.":[83],"We":[84],"show":[85],"that":[86],"our":[87],"DPP":[88],"system":[89],"with":[90],"improved":[91],"performs":[94],"competitively,":[95],"outperforming":[96],"strong":[97],"baselines":[99],"benchmark":[101],"datasets.":[102],"Our":[103],"findings":[104],"particularly":[106],"meaningful":[107],"summarizing":[109],"documents":[110],"created":[111],"multiple":[113],"authors":[114],"containing":[115],"redundant":[116],"yet":[117],"lexically":[118],"diverse":[119],"expressions.":[120],"1":[121]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":13},{"year":2021,"cited_by_count":18},{"year":2020,"cited_by_count":15},{"year":2019,"cited_by_count":7}],"updated_date":"2026-04-11T08:14:18.477133","created_date":"2025-10-10T00:00:00"}
