{"id":"https://openalex.org/W4406458265","doi":"https://doi.org/10.1109/bigdata62323.2024.10825107","title":"Text Summary Generation based on Data Augmentation and Contrastive Learning","display_name":"Text Summary Generation based on Data Augmentation and Contrastive Learning","publication_year":2024,"publication_date":"2024-12-15","ids":{"openalex":"https://openalex.org/W4406458265","doi":"https://doi.org/10.1109/bigdata62323.2024.10825107"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata62323.2024.10825107","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825107","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100677096","display_name":"Jenq\u2010Haur Wang","orcid":"https://orcid.org/0000-0002-6076-7380"},"institutions":[{"id":"https://openalex.org/I118292597","display_name":"National Taipei University of Technology","ror":"https://ror.org/00cn92c09","country_code":"TW","type":"education","lineage":["https://openalex.org/I118292597"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Jenq-Haur Wang","raw_affiliation_strings":["National Taipei University of Technology,Department of Computer Science and Information Engineering,Taipei,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Taipei University of Technology,Department of Computer Science and Information Engineering,Taipei,Taiwan","institution_ids":["https://openalex.org/I118292597"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101609096","display_name":"J. Zhuang","orcid":"https://orcid.org/0000-0002-2765-6339"},"institutions":[{"id":"https://openalex.org/I118292597","display_name":"National Taipei University of Technology","ror":"https://ror.org/00cn92c09","country_code":"TW","type":"education","lineage":["https://openalex.org/I118292597"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Jie-An Zhuang","raw_affiliation_strings":["National Taipei University of Technology,Department of Computer Science and Information Engineering,Taipei,Taiwan"],"affiliations":[{"raw_affiliation_string":"National Taipei University of Technology,Department of Computer Science and Information Engineering,Taipei,Taiwan","institution_ids":["https://openalex.org/I118292597"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5100677096"],"corresponding_institution_ids":["https://openalex.org/I118292597"],"apc_list":null,"apc_paid":null,"fwci":0.3626,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.70774619,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"7218","last_page":"7224"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7514068484306335},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5317603349685669},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44693857431411743}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7514068484306335},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5317603349685669},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44693857431411743}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata62323.2024.10825107","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825107","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320331164","display_name":"National Science and Technology Council","ror":"https://ror.org/00wnb9798"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W2154652894","https://openalex.org/W2170240176","https://openalex.org/W2606974598","https://openalex.org/W2888482885","https://openalex.org/W2888556271","https://openalex.org/W2924690340","https://openalex.org/W2949615363","https://openalex.org/W2952138241","https://openalex.org/W2965373594","https://openalex.org/W2970419734","https://openalex.org/W3035252911","https://openalex.org/W3156636935","https://openalex.org/W3173210704","https://openalex.org/W3175362188","https://openalex.org/W3175875420","https://openalex.org/W3197319555","https://openalex.org/W4205480693","https://openalex.org/W4205807230","https://openalex.org/W4225934689","https://openalex.org/W4226404354","https://openalex.org/W4226405594","https://openalex.org/W4385245566","https://openalex.org/W6631501603","https://openalex.org/W6632455782","https://openalex.org/W6682631176","https://openalex.org/W6685053522","https://openalex.org/W6755207826","https://openalex.org/W6761268247","https://openalex.org/W6766673545","https://openalex.org/W6771915120","https://openalex.org/W6843992823"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W3204019825"],"abstract_inverted_index":{"In":[0,140],"recent":[1],"years,":[2],"there":[3],"has":[4,50],"been":[5],"a":[6,130,237],"rapid":[7],"growth":[8],"in":[9,68,112,207,265,268],"the":[10,155,168,171,183,189,196,224,251,263],"volume":[11,39],"of":[12,60,240,245,253],"textual":[13],"data":[14,116,146],"generated":[15],"from":[16,126],"various":[17,27,269],"sources,":[18],"including":[19],"industries,":[20],"news":[21],"media,":[22,25],"and":[23,34,62,91,120,129,136,153,177,198,215,242,247],"social":[24],"across":[26],"fields":[28],"worldwide.":[29],"It":[30],"contains":[31,118],"valuable":[32],"information":[33,61],"knowledge,":[35],"but":[36],"its":[37],"sheer":[38],"requires":[40],"effective":[41],"summarization":[42,49,76],"techniques":[43],"to":[44,148,164,166,212,223,261],"make":[45],"it":[46],"useful.":[47],"Text":[48],"thus":[51],"become":[52],"an":[53],"important":[54],"technology":[55],"for":[56,101],"distilling":[57],"large":[58,69],"amounts":[59],"capturing":[63],"key":[64],"insights.":[65],"With":[66],"advancements":[67],"language":[70,123],"models":[71,77,80,85,108,124,214],"(LLMs),":[72],"most":[73,121],"existing":[74,216],"abstractive":[75],"leverage":[78],"pretrained":[79,122,213],"such":[81],"as":[82,188],"BART.":[83],"These":[84,107],"are":[86],"based":[87],"on":[88,98,195],"Transformer":[89],"architectures":[90],"undergo":[92],"unsupervised":[93],"pretraining,":[94],"followed":[95],"by":[96],"fine-tuning":[97],"specific":[99],"datasets":[100,200],"downstream":[102],"tasks,":[103],"particularly":[104],"text":[105,151,209],"summarization.":[106],"have":[109],"demonstrated":[110],"superiority":[111],"this":[113,141,203],"field.":[114],"Real-world":[115],"often":[117],"noise,":[119],"suffer":[125],"exposure":[127],"bias":[128],"discrepancy":[131],"between":[132,170],"their":[133],"training":[134],"objectives":[135],"real":[137],"evaluation":[138],"metrics.":[139],"paper,":[142],"we":[143],"introduce":[144],"sentence-level":[145],"augmentation":[147],"simulate":[149],"real-world":[150,266],"variations":[152],"enhance":[154],"model's":[156],"denoising":[157],"capability.":[158],"Furthermore,":[159],"contrastive":[160,219,231],"learning":[161,226],"is":[162,186,259],"employed":[163],"learn":[165],"distinguish":[167],"differences":[169],"original":[172],"article":[173,185],"with":[174,218,230],"candidate":[175,179],"summaries":[176,180,210],"among":[178],"themselves.":[181],"Finally,":[182],"highest-scoring":[184],"output":[187],"resulting":[190],"summary.":[191],"The":[192],"experimental":[193],"results":[194],"CNN/DailyMail":[197],"XSum":[199],"indicate":[201],"that":[202],"model":[204],"shows":[205,250],"improvement":[206],"generating":[208],"compared":[211],"methods":[217],"learning.":[220],"When":[221],"comparing":[222],"multitask":[225],"framework":[227],"BRIO":[228],"variant":[229],"loss,":[232],"our":[233,254],"proposed":[234,255],"method":[235],"achieves":[236],"better":[238],"ROUGE-1":[239],"48.52":[241],"comparable":[243],"ROUGE-2/L":[244],"24.84":[246],"39.78.":[248],"This":[249],"potential":[252],"method.":[256],"Further":[257],"investigation":[258],"needed":[260],"verify":[262],"performance":[264],"texts":[267],"domains.":[270]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
