{"id":"https://openalex.org/W4404291558","doi":"https://doi.org/10.1007/s40747-024-01653-3","title":"Automatical sampling with heterogeneous corpora for grammatical error correction","display_name":"Automatical sampling with heterogeneous corpora for grammatical error correction","publication_year":2024,"publication_date":"2024-11-12","ids":{"openalex":"https://openalex.org/W4404291558","doi":"https://doi.org/10.1007/s40747-024-01653-3"},"language":"en","primary_location":{"id":"doi:10.1007/s40747-024-01653-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-024-01653-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-024-01653-3.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://link.springer.com/content/pdf/10.1007/s40747-024-01653-3.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081426155","display_name":"Simeng Zhu","orcid":"https://orcid.org/0000-0003-0850-6690"},"institutions":[{"id":"https://openalex.org/I10660446","display_name":"Kunming University of Science and Technology","ror":"https://ror.org/00xyeez13","country_code":"CN","type":"education","lineage":["https://openalex.org/I10660446"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shichang Zhu","raw_affiliation_strings":["Faculty of Information Engineering and Automation, Yunnan Key Laboratory of Artificial Intelligence, Kunming University of Science and Technology, Kunming, China"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Engineering and Automation, Yunnan Key Laboratory of Artificial Intelligence, Kunming University of Science and Technology, Kunming, China","institution_ids":["https://openalex.org/I10660446"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054206349","display_name":"Jianjian Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I10660446","display_name":"Kunming University of Science and Technology","ror":"https://ror.org/00xyeez13","country_code":"CN","type":"education","lineage":["https://openalex.org/I10660446"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianjian Liu","raw_affiliation_strings":["Faculty of Information Engineering and Automation, Yunnan Key Laboratory of Artificial Intelligence, Kunming University of Science and Technology, Kunming, China"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Engineering and Automation, Yunnan Key Laboratory of Artificial Intelligence, Kunming University of Science and Technology, Kunming, China","institution_ids":["https://openalex.org/I10660446"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100414164","display_name":"Ying Li","orcid":"https://orcid.org/0000-0002-1800-0901"},"institutions":[{"id":"https://openalex.org/I10660446","display_name":"Kunming University of Science and Technology","ror":"https://ror.org/00xyeez13","country_code":"CN","type":"education","lineage":["https://openalex.org/I10660446"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying Li","raw_affiliation_strings":["Faculty of Information Engineering and Automation, Yunnan Key Laboratory of Artificial Intelligence, Kunming University of Science and Technology, Kunming, China"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Engineering and Automation, Yunnan Key Laboratory of Artificial Intelligence, Kunming University of Science and Technology, Kunming, China","institution_ids":["https://openalex.org/I10660446"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5114488777","display_name":"Zhengtao Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I10660446","display_name":"Kunming University of Science and Technology","ror":"https://ror.org/00xyeez13","country_code":"CN","type":"education","lineage":["https://openalex.org/I10660446"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhengtao Yu","raw_affiliation_strings":["Faculty of Information Engineering and Automation, Yunnan Key Laboratory of Artificial Intelligence, Kunming University of Science and Technology, Kunming, China"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Engineering and Automation, Yunnan Key Laboratory of Artificial Intelligence, Kunming University of Science and Technology, Kunming, China","institution_ids":["https://openalex.org/I10660446"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5081426155"],"corresponding_institution_ids":["https://openalex.org/I10660446"],"apc_list":{"value":1320,"currency":"GBP","value_usd":1619},"apc_paid":{"value":1320,"currency":"GBP","value_usd":1619},"fwci":0.3369,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.67867407,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"11","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computational-intelligence","display_name":"Computational intelligence","score":0.6635974049568176},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.6155120134353638},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5198403000831604},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5093449354171753},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4796909987926483},{"id":"https://openalex.org/keywords/sampling-error","display_name":"Sampling error","score":0.43609219789505005},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.3853839337825775},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.29540377855300903},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.27344781160354614},{"id":"https://openalex.org/keywords/observational-error","display_name":"Observational error","score":0.08998891711235046},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.0804905891418457},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.061967700719833374}],"concepts":[{"id":"https://openalex.org/C139502532","wikidata":"https://www.wikidata.org/wiki/Q1122090","display_name":"Computational intelligence","level":2,"score":0.6635974049568176},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.6155120134353638},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5198403000831604},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5093449354171753},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4796909987926483},{"id":"https://openalex.org/C165473641","wikidata":"https://www.wikidata.org/wiki/Q3306280","display_name":"Sampling error","level":3,"score":0.43609219789505005},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3853839337825775},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.29540377855300903},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.27344781160354614},{"id":"https://openalex.org/C19619285","wikidata":"https://www.wikidata.org/wiki/Q196372","display_name":"Observational error","level":2,"score":0.08998891711235046},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0804905891418457},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.061967700719833374},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s40747-024-01653-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-024-01653-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-024-01653-3.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:c317d7bcdd2a47529935c35ada7e8d56","is_oa":true,"landing_page_url":"https://doaj.org/article/c317d7bcdd2a47529935c35ada7e8d56","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Complex & Intelligent Systems, Vol 11, Iss 1, Pp 1-11 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1007/s40747-024-01653-3","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-024-01653-3","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-024-01653-3.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5199999809265137,"id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G1070218178","display_name":null,"funder_award_id":"F0701","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G160098265","display_name":null,"funder_award_id":"202401","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1740161482","display_name":null,"funder_award_id":"62306129, U21B2027, 62366027","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2374625443","display_name":null,"funder_award_id":"202103AA080015","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3216677882","display_name":null,"funder_award_id":"201606","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3310436768","display_name":null,"funder_award_id":"62366027","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3780253623","display_name":null,"funder_award_id":"62266028","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4479882814","display_name":null,"funder_award_id":"U21B2027","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5760752404","display_name":null,"funder_award_id":"Projects","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5881942141","display_name":null,"funder_award_id":"202103","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8955107213","display_name":null,"funder_award_id":"Major","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320324302","display_name":"Kunming University of Science and Technology","ror":"https://ror.org/00xyeez13"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4404291558.pdf"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W2168322422","https://openalex.org/W2194775991","https://openalex.org/W2251873470","https://openalex.org/W2589277916","https://openalex.org/W2886474102","https://openalex.org/W2914707095","https://openalex.org/W2945059185","https://openalex.org/W2963881719","https://openalex.org/W2964082031","https://openalex.org/W2970076840","https://openalex.org/W2997636815","https://openalex.org/W2999970869","https://openalex.org/W3034999214","https://openalex.org/W3037002737","https://openalex.org/W3037162118","https://openalex.org/W3093312917","https://openalex.org/W3104669693","https://openalex.org/W3104681546","https://openalex.org/W4224921333","https://openalex.org/W4385567238","https://openalex.org/W4385570567","https://openalex.org/W4385570694","https://openalex.org/W4385570817","https://openalex.org/W4385571043","https://openalex.org/W4385571296","https://openalex.org/W4385571532","https://openalex.org/W4385571866","https://openalex.org/W4385573567","https://openalex.org/W4385573850","https://openalex.org/W4389518883","https://openalex.org/W4389519894"],"related_works":["https://openalex.org/W2005846717","https://openalex.org/W4245369150","https://openalex.org/W2356796168","https://openalex.org/W99741415","https://openalex.org/W1977524596","https://openalex.org/W129898351","https://openalex.org/W1530382326","https://openalex.org/W4212775797","https://openalex.org/W2021715390","https://openalex.org/W1967821533"],"abstract_inverted_index":{"Thanks":[0],"to":[1,58,97],"the":[2,7,26,39,115,141,151,156,167,180],"strong":[3],"representation":[4],"capability":[5],"of":[6,29,41,80,143,159,169,182],"pre-trained":[8,130],"language":[9,131],"models,":[10],"supervised":[11],"grammatical":[12,125,170],"error":[13,81,126,171],"correction":[14,127],"has":[15],"achieved":[16],"promising":[17],"performance.":[18],"However,":[19],"traditional":[20],"model":[21,34,136],"training":[22,42],"depends":[23],"significantly":[24],"on":[25,87,106,150],"large":[27],"scale":[28],"similar":[30],"distributed":[31],"samples.":[32,148],"The":[33,173],"performance":[35],"decreases":[36],"sharply":[37],"once":[38],"distributions":[40,86],"and":[43,66,83,113,123,133,146],"testing":[44],"data":[45],"are":[46],"inconsistent.":[47],"To":[48],"address":[49],"this":[50],"issue,":[51],"we":[52,74,119],"propose":[53],"an":[54],"automatic":[55],"sampling":[56],"approach":[57,94],"effectively":[59],"select":[60],"high-quality":[61],"samples":[62,112],"from":[63],"different":[64,99,160,183],"corpora":[65,161],"filter":[67],"out":[68],"irrelevant":[69],"or":[70],"harmful":[71],"ones.":[72,117],"Concretely,":[73],"first":[75],"provide":[76],"a":[77,135],"detailed":[78,174],"analysis":[79,107,175],"type":[82],"sentence":[84],"length":[85],"all":[88],"datasets.":[89],"Second,":[90],"our":[91],"corpus":[92,184],"weighting":[93,185],"is":[95,162],"exploited":[96],"yield":[98],"weights":[100],"for":[101,139],"each":[102],"sample":[103],"automatically":[104],"based":[105],"results,":[108],"thus":[109],"emphasizing":[110],"beneficial":[111],"ignoring":[114],"noisy":[116],"Finally,":[118],"enhance":[120],"typical":[121],"Seq2Seq":[122],"Seq2Edit":[124],"models":[128,132,145],"with":[129],"design":[134],"ensemble":[137],"algorithm":[138],"integrating":[140],"advantages":[142],"heterogeneous":[144],"weighted":[147],"Experiments":[149],"benchmark":[152],"datasets":[153],"demonstrate":[154],"that":[155],"proper":[157],"utilization":[158],"extremely":[163],"helpful":[164],"in":[165],"enhancing":[166],"accuracy":[168],"correction.":[172],"gains":[176],"more":[177],"insights":[178],"into":[179],"effect":[181],"strategies.":[186]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-10T00:00:00"}
