{"id":"https://openalex.org/W4382201666","doi":"https://doi.org/10.1145/3582768.3582797","title":"A corpus of drafts of NLP papers from non-native English speakers","display_name":"A corpus of drafts of NLP papers from non-native English speakers","publication_year":2022,"publication_date":"2022-12-16","ids":{"openalex":"https://openalex.org/W4382201666","doi":"https://doi.org/10.1145/3582768.3582797"},"language":"en","primary_location":{"id":"doi:10.1145/3582768.3582797","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3582768.3582797","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 6th International Conference on Natural Language Processing and Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075351291","display_name":"Haotong Wang","orcid":"https://orcid.org/0000-0003-3209-5932"},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Haotong Wang","raw_affiliation_strings":["Graduate School of Information, Production and Systems, Waseda University, Japan"],"raw_orcid":"https://orcid.org/0000-0003-3209-5932","affiliations":[{"raw_affiliation_string":"Graduate School of Information, Production and Systems, Waseda University, Japan","institution_ids":["https://openalex.org/I150744194"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100416798","display_name":"Liyan Wang","orcid":"https://orcid.org/0000-0002-9561-5037"},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Liyan Wang","raw_affiliation_strings":["Graduate School of Information, Production and Systems, Waseda University, Japan"],"raw_orcid":"https://orcid.org/0000-0002-9561-5037","affiliations":[{"raw_affiliation_string":"Graduate School of Information, Production and Systems, Waseda University, Japan","institution_ids":["https://openalex.org/I150744194"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060121645","display_name":"Yves Lepage","orcid":"https://orcid.org/0000-0002-3059-4271"},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Lepage Yves","raw_affiliation_strings":["Graduate School of Information, Production and Systems, Waseda University, Japan"],"raw_orcid":"https://orcid.org/0000-0002-3059-4271","affiliations":[{"raw_affiliation_string":"Graduate School of Information, Production and Systems, Waseda University, Japan","institution_ids":["https://openalex.org/I150744194"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5075351291"],"corresponding_institution_ids":["https://openalex.org/I150744194"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.19361313,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"125","last_page":"129"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8456922769546509},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7916520237922668},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7187920212745667},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.6592256426811218},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6414089798927307},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.6155072450637817},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5453923344612122},{"id":"https://openalex.org/keywords/parallel-corpora","display_name":"Parallel corpora","score":0.49659115076065063},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3415578603744507},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.3217829465866089},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.23696082830429077}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8456922769546509},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7916520237922668},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7187920212745667},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.6592256426811218},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6414089798927307},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.6155072450637817},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5453923344612122},{"id":"https://openalex.org/C2985367798","wikidata":"https://www.wikidata.org/wiki/Q1346592","display_name":"Parallel corpora","level":3,"score":0.49659115076065063},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3415578603744507},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3217829465866089},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.23696082830429077},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3582768.3582797","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3582768.3582797","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 6th International Conference on Natural Language Processing and Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8199999928474426,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W1481128830","https://openalex.org/W2117334662","https://openalex.org/W2181262297","https://openalex.org/W2250290162","https://openalex.org/W2295598076","https://openalex.org/W2602331152","https://openalex.org/W2962769776","https://openalex.org/W2964413085","https://openalex.org/W3114208363","https://openalex.org/W4234670185"],"related_works":["https://openalex.org/W2375873920","https://openalex.org/W2146114872","https://openalex.org/W2392060890","https://openalex.org/W2392760275","https://openalex.org/W2083530853","https://openalex.org/W2009831055","https://openalex.org/W2393172683","https://openalex.org/W3211744874","https://openalex.org/W1994626569","https://openalex.org/W2368686738"],"abstract_inverted_index":{"We":[0,59,92],"created":[1],"an":[2],"English":[3,47],"parallel":[4],"corpus":[5,66],"of":[6,33,42,64,97],"3,005":[7],"sentence":[8],"pairs,":[9],"each":[10],"containing":[11],"a":[12,61,76],"well-polished":[13],"text":[14],"from":[15,27,45,84],"ACL":[16],"Anthology":[17],"Reference":[18],"Corpus":[19],"(ACL-ARC)":[20],"[1]":[21],"and":[22],"corresponding":[23],"restated":[24],"drafts":[25,44,83],"collected":[26,111],"26":[28],"non-native":[29,46],"writers.":[30],"The":[31],"purpose":[32],"this":[34],"paper":[35],"is":[36],"to":[37,51,80,114],"explore":[38],"the":[39,43,65,95,102,110],"writing":[40],"features":[41,100,105],"speakers,":[48],"so":[49],"as":[50],"benefit":[52],"research":[53],"in":[54],"Academic":[55],"Writing":[56],"Aid":[57],"Systems.":[58],"present":[60],"feature":[62],"analysis":[63],"based":[67,88],"on":[68,89,109],"handcrafted":[69,104],"features.":[70,91],"To":[71],"assess":[72],"utility,":[73],"we":[74],"formulate":[75],"draft":[77],"identification":[78,107],"task":[79],"automatically":[81],"recognize":[82],"ground":[85],"truth":[86],"texts":[87],"hybrid":[90],"show":[93],"that":[94],"combination":[96],"deep":[98],"semantic":[99],"with":[101],"optimal":[103],"improves":[106],"accuracy":[108],"data,":[112],"up":[113],"84.57%.":[115]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
