{"id":"https://openalex.org/W2970238989","doi":"https://doi.org/10.18653/v1/w19-4445","title":"Application of an Automatic Plagiarism Detection System in a Large-scale Assessment of English Speaking Proficiency","display_name":"Application of an Automatic Plagiarism Detection System in a Large-scale Assessment of English Speaking Proficiency","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2970238989","doi":"https://doi.org/10.18653/v1/w19-4445","mag":"2970238989"},"language":"en","primary_location":{"id":"doi:10.18653/v1/w19-4445","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w19-4445","pdf_url":"https://www.aclweb.org/anthology/W19-4445.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Fourteenth Workshop on Innovative Use of NLP for Building Educational Applications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/W19-4445.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100772594","display_name":"Xinhao Wang","orcid":"https://orcid.org/0000-0002-0366-7543"},"institutions":[{"id":"https://openalex.org/I1341030882","display_name":"Educational Testing Service","ror":"https://ror.org/03b5q4637","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1341030882"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xinhao Wang","raw_affiliation_strings":["Educational Testing Service 1 90 New Montgomery St #1450, San Francisco, CA 94105, USA"],"affiliations":[{"raw_affiliation_string":"Educational Testing Service 1 90 New Montgomery St #1450, San Francisco, CA 94105, USA","institution_ids":["https://openalex.org/I1341030882"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030816616","display_name":"Keelan Evanini","orcid":"https://orcid.org/0000-0003-4243-3376"},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Keelan Evanini","raw_affiliation_strings":["660 Rosedale Road, Princeton, NJ 08541, USA"],"affiliations":[{"raw_affiliation_string":"660 Rosedale Road, Princeton, NJ 08541, USA","institution_ids":["https://openalex.org/I20089843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108692434","display_name":"Matthew Mulholland","orcid":null},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Matthew Mulholland","raw_affiliation_strings":["660 Rosedale Road, Princeton, NJ 08541, USA"],"affiliations":[{"raw_affiliation_string":"660 Rosedale Road, Princeton, NJ 08541, USA","institution_ids":["https://openalex.org/I20089843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100342006","display_name":"Yao Qian","orcid":"https://orcid.org/0000-0003-1855-9630"},"institutions":[{"id":"https://openalex.org/I1341030882","display_name":"Educational Testing Service","ror":"https://ror.org/03b5q4637","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I1341030882"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yao Qian","raw_affiliation_strings":["Educational Testing Service 1 90 New Montgomery St #1450, San Francisco, CA 94105, USA"],"affiliations":[{"raw_affiliation_string":"Educational Testing Service 1 90 New Montgomery St #1450, San Francisco, CA 94105, USA","institution_ids":["https://openalex.org/I1341030882"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048995937","display_name":"James V. Bruno","orcid":null},"institutions":[{"id":"https://openalex.org/I20089843","display_name":"Princeton University","ror":"https://ror.org/00hx57361","country_code":"US","type":"education","lineage":["https://openalex.org/I20089843"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"James V. Bruno","raw_affiliation_strings":["660 Rosedale Road, Princeton, NJ 08541, USA"],"affiliations":[{"raw_affiliation_string":"660 Rosedale Road, Princeton, NJ 08541, USA","institution_ids":["https://openalex.org/I20089843"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100772594"],"corresponding_institution_ids":["https://openalex.org/I1341030882"],"apc_list":null,"apc_paid":null,"fwci":0.1445,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.57848269,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"435","last_page":"443"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7672340869903564},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6642330288887024},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.576873242855072},{"id":"https://openalex.org/keywords/plagiarism-detection","display_name":"Plagiarism detection","score":0.5722032189369202},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.533397912979126},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.494307279586792},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.47440338134765625},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4614798426628113},{"id":"https://openalex.org/keywords/recall","display_name":"Recall","score":0.4604504704475403},{"id":"https://openalex.org/keywords/language-proficiency","display_name":"Language proficiency","score":0.44491639733314514},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.43044963479042053},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1506049633026123},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.13061794638633728},{"id":"https://openalex.org/keywords/mathematics-education","display_name":"Mathematics education","score":0.1021413803100586}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7672340869903564},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6642330288887024},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.576873242855072},{"id":"https://openalex.org/C2780907237","wikidata":"https://www.wikidata.org/wiki/Q2986238","display_name":"Plagiarism detection","level":2,"score":0.5722032189369202},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.533397912979126},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.494307279586792},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.47440338134765625},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4614798426628113},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.4604504704475403},{"id":"https://openalex.org/C2778883600","wikidata":"https://www.wikidata.org/wiki/Q2390977","display_name":"Language proficiency","level":2,"score":0.44491639733314514},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.43044963479042053},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1506049633026123},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.13061794638633728},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.1021413803100586},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/w19-4445","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w19-4445","pdf_url":"https://www.aclweb.org/anthology/W19-4445.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Fourteenth Workshop on Innovative Use of NLP for Building Educational Applications","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/w19-4445","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w19-4445","pdf_url":"https://www.aclweb.org/anthology/W19-4445.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Fourteenth Workshop on Innovative Use of NLP for Building Educational Applications","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8199999928474426,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2970238989.pdf","grobid_xml":"https://content.openalex.org/works/W2970238989.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W270731963","https://openalex.org/W658020064","https://openalex.org/W1493309689","https://openalex.org/W1544505227","https://openalex.org/W1575261888","https://openalex.org/W1596691921","https://openalex.org/W1974336599","https://openalex.org/W1979364015","https://openalex.org/W2049422789","https://openalex.org/W2069985874","https://openalex.org/W2101234009","https://openalex.org/W2113403290","https://openalex.org/W2122355855","https://openalex.org/W2125101937","https://openalex.org/W2147742901","https://openalex.org/W2150862929","https://openalex.org/W2170494111","https://openalex.org/W2251574625","https://openalex.org/W2398753020","https://openalex.org/W2404948255","https://openalex.org/W2586177144","https://openalex.org/W2787381839","https://openalex.org/W3006365793","https://openalex.org/W3008251515"],"related_works":["https://openalex.org/W4287126803","https://openalex.org/W3168266056","https://openalex.org/W4250737080","https://openalex.org/W2735162248","https://openalex.org/W2112890327","https://openalex.org/W311440260","https://openalex.org/W2945111072","https://openalex.org/W1496191935","https://openalex.org/W3080940603","https://openalex.org/W17414112"],"abstract_inverted_index":{"This":[0,121],"study":[1],"aims":[2],"to":[3,32,154],"build":[4],"an":[5,19,76,93,113],"automatic":[6],"system":[7,122,149],"for":[8,25,59,70],"the":[9,16,54,102,118,135,147,156],"detection":[10,58],"of":[11,18,21,43,56,115,134,141,158,164],"plagiarized":[12,35,119],"spoken":[13,166],"responses":[14,38,128],"in":[15,53,112],"context":[17],"assessment":[20,97,136,163],"English":[22,95],"speaking":[23,63],"proficiency":[24,64,96],"non-native":[26,165],"speakers.":[27],"Classification":[28],"models":[29],"were":[30,67,83],"trained":[31],"distinguish":[33],"between":[34],"and":[36,62,73,101,137,161],"nonplagiarized":[37],"with":[39],"two":[40],"different":[41],"types":[42],"features:":[44],"text-to-text":[45],"content":[46],"similarity":[47],"measures,":[48,65],"which":[49,66],"are":[50],"commonly":[51],"used":[52,153],"task":[55],"plagiarism":[57],"written":[60],"documents,":[61],"specifically":[68],"designed":[69],"spontaneous":[71],"speech":[72,78],"extracted":[74],"using":[75],"automated":[77,162],"scoring":[79],"system.":[80],"The":[81,143],"experiments":[82],"first":[84],"conducted":[85],"on":[86,105,117,126],"a":[87,131,139],"large":[88],"data":[89,109],"set":[90,110],"drawn":[91],"from":[92,130],"operational":[94,127],"across":[98],"multiple":[99],"years,":[100],"best":[103],"classifier":[104],"this":[106],"heavily":[107],"imbalanced":[108],"resulted":[111],"F1-score":[114],"0.761":[116],"class.":[120],"was":[123],"then":[124],"validated":[125],"collected":[129],"single":[132],"administration":[133],"achieved":[138],"recall":[140],"0.897.":[142],"results":[144],"indicate":[145],"that":[146],"proposed":[148],"can":[150],"potentially":[151],"be":[152],"improve":[155],"validity":[157],"both":[159],"human":[160],"English.":[167]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
