{"id":"https://openalex.org/W2624054275","doi":"https://doi.org/10.3390/info8020064","title":"Identifying High Quality Document\u2013Summary Pairs through Text Matching","display_name":"Identifying High Quality Document\u2013Summary Pairs through Text Matching","publication_year":2017,"publication_date":"2017-06-12","ids":{"openalex":"https://openalex.org/W2624054275","doi":"https://doi.org/10.3390/info8020064","mag":"2624054275"},"language":"en","primary_location":{"id":"doi:10.3390/info8020064","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info8020064","pdf_url":"https://www.mdpi.com/2078-2489/8/2/64/pdf?version=1497237645","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2078-2489/8/2/64/pdf?version=1497237645","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027262293","display_name":"Yongshuai Hou","orcid":"https://orcid.org/0000-0001-6994-8295"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongshuai Hou","raw_affiliation_strings":["Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008082945","display_name":"Yang Xiang","orcid":"https://orcid.org/0000-0001-9714-1210"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yang Xiang","raw_affiliation_strings":["Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014238603","display_name":"Buzhou Tang","orcid":"https://orcid.org/0000-0003-0271-8246"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Buzhou Tang","raw_affiliation_strings":["Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101895423","display_name":"Qingcai Chen","orcid":"https://orcid.org/0000-0001-8473-7293"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingcai Chen","raw_affiliation_strings":["Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100424254","display_name":"Xiaolong Wang","orcid":"https://orcid.org/0000-0001-9003-4252"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaolong Wang","raw_affiliation_strings":["Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040633442","display_name":"Fangze Zhu","orcid":"https://orcid.org/0000-0002-7535-7552"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fangze Zhu","raw_affiliation_strings":["Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligence Computing Research Center, Harbin Institute of Technology Shenzhen Graduate School, Shenzhen 518055, China","institution_ids":["https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5008082945"],"corresponding_institution_ids":["https://openalex.org/I204983213"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":0.413,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.7136719,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"8","issue":"2","first_page":"64","last_page":"64"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.9082167744636536},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8250046372413635},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7016312479972839},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6146050095558167},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6126335859298706},{"id":"https://openalex.org/keywords/test-set","display_name":"Test set","score":0.5487931966781616},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5164918899536133},{"id":"https://openalex.org/keywords/multi-document-summarization","display_name":"Multi-document summarization","score":0.48332810401916504},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.46345704793930054},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4514712691307068},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.44517287611961365},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4416097402572632},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.4383810758590698},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.43655329942703247},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4107927680015564}],"concepts":[{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.9082167744636536},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8250046372413635},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7016312479972839},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6146050095558167},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6126335859298706},{"id":"https://openalex.org/C169903167","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Test set","level":2,"score":0.5487931966781616},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5164918899536133},{"id":"https://openalex.org/C134714966","wikidata":"https://www.wikidata.org/wiki/Q6934448","display_name":"Multi-document summarization","level":3,"score":0.48332810401916504},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.46345704793930054},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4514712691307068},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.44517287611961365},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4416097402572632},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.4383810758590698},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.43655329942703247},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4107927680015564},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/info8020064","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info8020064","pdf_url":"https://www.mdpi.com/2078-2489/8/2/64/pdf?version=1497237645","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},{"id":"pmh:oai:mdpi.com:/2078-2489/8/2/64/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/info8020064","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Information; Volume 8; Issue 2; Pages: 64","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/info8020064","is_oa":true,"landing_page_url":"https://doi.org/10.3390/info8020064","pdf_url":"https://www.mdpi.com/2078-2489/8/2/64/pdf?version=1497237645","source":{"id":"https://openalex.org/S4210219776","display_name":"Information","issn_l":"2078-2489","issn":["2078-2489"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Information","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.8100000023841858,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G1422164818","display_name":null,"funder_award_id":"JCYJ20140417172417105","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2060668466","display_name":null,"funder_award_id":"61473101","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2350075274","display_name":"\u9762\u5411\u771f\u5b9e\u73af\u5883\u7684\u5f02\u6784\u4fe1\u606f\u4ea4\u4e92\u5f0f\u95ee\u7b54\u7406\u8bba\u4e0e\u65b9\u6cd5\u7814\u7a76","funder_award_id":"61272383","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3881918265","display_name":null,"funder_award_id":"2015AA015405","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4243412236","display_name":null,"funder_award_id":"863 Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7128034784","display_name":null,"funder_award_id":"61402128","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8797872116","display_name":null,"funder_award_id":"JCYJ20140508161040764","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320316083","display_name":"Tencent","ror":"https://ror.org/00hhjss72"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335773","display_name":"National High-tech Research and Development Program","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2624054275.pdf","grobid_xml":"https://content.openalex.org/works/W2624054275.grobid-xml"},"referenced_works_count":63,"referenced_works":["https://openalex.org/W168564468","https://openalex.org/W1495207358","https://openalex.org/W1566139570","https://openalex.org/W1832693441","https://openalex.org/W1843891098","https://openalex.org/W1880262756","https://openalex.org/W1924770834","https://openalex.org/W1939882552","https://openalex.org/W2056609756","https://openalex.org/W2062227835","https://openalex.org/W2063392856","https://openalex.org/W2064675550","https://openalex.org/W2078841894","https://openalex.org/W2099592858","https://openalex.org/W2101234009","https://openalex.org/W2102269292","https://openalex.org/W2110693578","https://openalex.org/W2118463056","https://openalex.org/W2119821739","https://openalex.org/W2123086176","https://openalex.org/W2133197587","https://openalex.org/W2133564696","https://openalex.org/W2143205289","https://openalex.org/W2144270295","https://openalex.org/W2147152072","https://openalex.org/W2158997610","https://openalex.org/W2165612380","https://openalex.org/W2222491148","https://openalex.org/W2248073783","https://openalex.org/W2249237221","https://openalex.org/W2250483006","https://openalex.org/W2250694912","https://openalex.org/W2250966211","https://openalex.org/W2251394420","https://openalex.org/W2251478476","https://openalex.org/W2251911042","https://openalex.org/W2272941681","https://openalex.org/W2293778248","https://openalex.org/W2294136999","https://openalex.org/W2307381258","https://openalex.org/W2317879529","https://openalex.org/W2341401723","https://openalex.org/W2427312199","https://openalex.org/W2468484304","https://openalex.org/W2507634323","https://openalex.org/W2511929605","https://openalex.org/W2512531235","https://openalex.org/W2517782820","https://openalex.org/W2594895664","https://openalex.org/W2951359136","https://openalex.org/W2951777553","https://openalex.org/W2962965405","https://openalex.org/W2962996600","https://openalex.org/W2963929190","https://openalex.org/W2964259363","https://openalex.org/W3101913037","https://openalex.org/W4231510805","https://openalex.org/W4239510810","https://openalex.org/W6639619044","https://openalex.org/W6675354045","https://openalex.org/W6682631176","https://openalex.org/W6694408396","https://openalex.org/W6697028822"],"related_works":["https://openalex.org/W2093597205","https://openalex.org/W2389846579","https://openalex.org/W2008129036","https://openalex.org/W2392495745","https://openalex.org/W132250100","https://openalex.org/W2386445476","https://openalex.org/W2968364752","https://openalex.org/W169063832","https://openalex.org/W2238929664","https://openalex.org/W2725657302"],"abstract_inverted_index":{"Text":[0],"summarization":[1],"namely,":[2],"automatically":[3],"generating":[4],"a":[5,9,13,24,38,53,66,71],"short":[6],"summary":[7],"of":[8,40,83,94],"given":[10],"document,":[11,96],"is":[12,36],"difficult":[14],"task":[15],"in":[16,109],"natural":[17],"language":[18],"processing.":[19],"Nowadays,":[20],"deep":[21,55],"learning":[22,56],"as":[23],"new":[25],"technique":[26],"has":[27],"gradually":[28],"been":[29],"deployed":[30],"for":[31,45,64],"text":[32],"summarization,":[33],"but":[34],"there":[35],"still":[37],"lack":[39],"large-scale":[41,67],"high":[42,60],"quality":[43,61,82],"datasets":[44],"this":[46,49],"technique.":[47],"In":[48,86],"paper,":[50],"we":[51,97],"proposed":[52,99],"novel":[54],"method":[57],"to":[58,79,88,132,145],"identify":[59],"document\u2013summary":[62,84],"pairs":[63,68],"building":[65],"dataset.":[69],"Concretely,":[70],"long":[72],"short-term":[73],"memory":[74],"(LSTM)-based":[75],"model":[76,103],"was":[77],"designed":[78],"measure":[80],"the":[81,106,110,116,120,136,146],"pairs.":[85],"order":[87],"leverage":[89],"information":[90],"across":[91],"all":[92],"parts":[93],"each":[95],"further":[98],"an":[100],"improved":[101],"LSTM-based":[102,137],"by":[104],"removing":[105],"forget":[107],"gate":[108],"LSTM":[111],"unit.":[112],"Experiments":[113],"conducted":[114],"on":[115],"training":[117],"set":[118,122],"and":[119],"test":[121],"built":[123],"upon":[124],"Sina":[125],"Weibo":[126],"(a":[127],"Chinese":[128],"microblog":[129],"website":[130],"similar":[131],"Twitter)":[133],"showed":[134],"that":[135],"models":[138,142],"significantly":[139],"outperformed":[140],"baseline":[141],"with":[143],"regard":[144],"area":[147],"under":[148],"receiver":[149],"operating":[150],"characteristic":[151],"curve":[152],"(AUC)":[153],"value.":[154]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2}],"updated_date":"2026-06-06T09:05:17.133730","created_date":"2025-10-10T00:00:00"}
