{"id":"https://openalex.org/W4312891566","doi":"https://doi.org/10.1109/ijcnn55064.2022.9892341","title":"3Rs: Data Augmentation Techniques Using Document Contexts For Low-Resource Chinese Named Entity Recognition","display_name":"3Rs: Data Augmentation Techniques Using Document Contexts For Low-Resource Chinese Named Entity Recognition","publication_year":2022,"publication_date":"2022-07-18","ids":{"openalex":"https://openalex.org/W4312891566","doi":"https://doi.org/10.1109/ijcnn55064.2022.9892341"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn55064.2022.9892341","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn55064.2022.9892341","pdf_url":null,"source":{"id":"https://openalex.org/S4363607707","display_name":"2022 International Joint Conference on Neural Networks (IJCNN)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047683619","display_name":"Zheyu Ying","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zheyu Ying","raw_affiliation_strings":["National Engineering Research Center for Software Engineering, Peking University","School of Software and Microelectronics, Peking University"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Software Engineering, Peking University","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Software and Microelectronics, Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089592709","display_name":"Jinglei Zhang","orcid":"https://orcid.org/0000-0003-1438-6568"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinglei Zhang","raw_affiliation_strings":["National Engineering Research Center for Software Engineering, Peking University","School of Software and Microelectronics, Peking University"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Software Engineering, Peking University","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Software and Microelectronics, Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014268902","display_name":"Rui Xie","orcid":"https://orcid.org/0000-0002-1756-7746"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Xie","raw_affiliation_strings":["National Engineering Research Center for Software Engineering, Peking University"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Software Engineering, Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005473471","display_name":"Guochang Wen","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guochang Wen","raw_affiliation_strings":["National Engineering Research Center for Software Engineering, Peking University","School of Software and Microelectronics, Peking University"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Software Engineering, Peking University","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Software and Microelectronics, Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100964132","display_name":"Feng Xiao","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Xiao","raw_affiliation_strings":["National Engineering Research Center for Software Engineering, Peking University","School of Software and Microelectronics, Peking University"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Software Engineering, Peking University","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Software and Microelectronics, Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102800878","display_name":"Xueyang Liu","orcid":"https://orcid.org/0009-0005-4063-9938"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xueyang Liu","raw_affiliation_strings":["National Engineering Research Center for Software Engineering, Peking University"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Software Engineering, Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101435571","display_name":"Shikun Zhang","orcid":"https://orcid.org/0000-0002-8576-2674"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shikun Zhang","raw_affiliation_strings":["National Engineering Research Center for Software Engineering, Peking University"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Software Engineering, Peking University","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5047683619"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16445809,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"7","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9829000234603882,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8346160650253296},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7863022089004517},{"id":"https://openalex.org/keywords/named-entity-recognition","display_name":"Named-entity recognition","score":0.6189092993736267},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5815117359161377},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5665438771247864},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.5026414394378662},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4659633934497833},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4634760320186615},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4583771228790283},{"id":"https://openalex.org/keywords/random-forest","display_name":"Random forest","score":0.4315699338912964},{"id":"https://openalex.org/keywords/conditional-random-field","display_name":"Conditional random field","score":0.42152416706085205},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34822142124176025}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8346160650253296},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7863022089004517},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.6189092993736267},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5815117359161377},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5665438771247864},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.5026414394378662},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4659633934497833},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4634760320186615},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4583771228790283},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.4315699338912964},{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.42152416706085205},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34822142124176025},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn55064.2022.9892341","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn55064.2022.9892341","pdf_url":null,"source":{"id":"https://openalex.org/S4363607707","display_name":"2022 International Joint Conference on Neural Networks (IJCNN)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1940872118","https://openalex.org/W1964162497","https://openalex.org/W2020278455","https://openalex.org/W2107598941","https://openalex.org/W2147218300","https://openalex.org/W2610850660","https://openalex.org/W2746314669","https://openalex.org/W2765407302","https://openalex.org/W2896457183","https://openalex.org/W2904415434","https://openalex.org/W2911489562","https://openalex.org/W2911588830","https://openalex.org/W2944223741","https://openalex.org/W2946068894","https://openalex.org/W2965373594","https://openalex.org/W2971296908","https://openalex.org/W2975059944","https://openalex.org/W2981573048","https://openalex.org/W2992308087","https://openalex.org/W2996428491","https://openalex.org/W2998508940","https://openalex.org/W3017961061","https://openalex.org/W3019125528","https://openalex.org/W3034238904","https://openalex.org/W3034340683","https://openalex.org/W3034379414","https://openalex.org/W3035625205","https://openalex.org/W3098341425","https://openalex.org/W3108842736","https://openalex.org/W3127662747","https://openalex.org/W3169506265","https://openalex.org/W3173277985","https://openalex.org/W3174311454","https://openalex.org/W3174828871","https://openalex.org/W3177330184","https://openalex.org/W3188708541","https://openalex.org/W3199520873","https://openalex.org/W4200046541","https://openalex.org/W6640362995"],"related_works":["https://openalex.org/W4250494529","https://openalex.org/W1964783010","https://openalex.org/W2399696375","https://openalex.org/W45206245","https://openalex.org/W2211396092","https://openalex.org/W2078793151","https://openalex.org/W2061834489","https://openalex.org/W2751906762","https://openalex.org/W3088215229","https://openalex.org/W3047727388"],"abstract_inverted_index":{"With":[0,58],"recent":[1,19],"advances":[2],"of":[3,28,35,60,109],"neural":[4],"networks":[5],"and":[6,38,71,88,112,129,153],"pre-training":[7],"techniques,":[8],"Chinese":[9,69,127],"Named":[10],"Entity":[11],"Recognition":[12],"(NER)":[13],"has":[14],"achieved":[15],"great":[16],"progress":[17],"in":[18,56,100],"years.":[20],"However,":[21],"NER":[22,40,70,82],"systems":[23],"still":[24],"have":[25],"the":[26,107,145],"problem":[27],"generalization":[29],"ability":[30],"issues":[31],"due":[32],"to":[33,105,135],"lack":[34],"annotated":[36],"data,":[37],"current":[39],"models":[41,49],"mostly":[42],"consider":[43],"input":[44],"sentences":[45],"individually,":[46],"which":[47,91],"prevent":[48],"from":[50],"further":[51],"exploiting":[52],"cross-sentence":[53],"document":[54],"context":[55],"training.":[57],"regard":[59],"these":[61],"problems,":[62],"this":[63],"paper":[64],"present":[65],"new":[66],"insights":[67],"into":[68],"propose":[72],"3Rs:":[73],"three":[74],"data":[75,97],"augmentation":[76,98],"methods":[77],"incorporating":[78],"document-level":[79],"information":[80],"for":[81,156],"through":[83],"random":[84,86,89],"concatenating,":[85],"swapping":[87],"erasing,":[90],"are":[92],"inspired":[93],"by":[94],"some":[95],"multi-sample":[96],"techniques":[99],"computer":[101],"vision":[102],"fields,":[103],"aiming":[104],"reorganize":[106],"composition":[108],"training":[110,115,158],"sentences,":[111],"generate":[113],"more":[114],"examples":[116],"with":[117],"less":[118],"human":[119],"efforts.":[120],"We":[121],"conduct":[122],"extensive":[123],"experiments":[124],"on":[125,164],"two":[126],"datasets,":[128],"introduce":[130],"a":[131,150],"two-level":[132],"attacking":[133],"method":[134],"audit":[136],"robustness":[137],"performance.":[138],"Our":[139],"experiment":[140],"results":[141],"show":[142],"that":[143],"even":[144],"best":[146],"model":[147],"can":[148],"obtain":[149],"better":[151],"accuracy":[152],"robustness,":[154],"especially":[155],"smaller":[157],"sets,":[159],"therefore":[160],"alleviating":[161],"performance":[162],"bottlenecks":[163],"low-resource":[165],"conditions.":[166]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
