{"id":"https://openalex.org/W2147528976","doi":"https://doi.org/10.1162/coli_a_00153","title":"Plagiarism Meets Paraphrasing: Insights for the Next Generation in Automatic Plagiarism Detection","display_name":"Plagiarism Meets Paraphrasing: Insights for the Next Generation in Automatic Plagiarism Detection","publication_year":2013,"publication_date":"2013-01-03","ids":{"openalex":"https://openalex.org/W2147528976","doi":"https://doi.org/10.1162/coli_a_00153","mag":"2147528976"},"language":"en","primary_location":{"id":"doi:10.1162/coli_a_00153","is_oa":false,"landing_page_url":"https://doi.org/10.1162/coli_a_00153","pdf_url":null,"source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hdl.handle.net/2117/20297","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067489760","display_name":"Alberto Barr\u00f3n\u2010Cede\u00f1o","orcid":"https://orcid.org/0000-0003-4719-3420"},"institutions":[{"id":"https://openalex.org/I9617848","display_name":"Universitat Polit\u00e8cnica de Catalunya","ror":"https://ror.org/03mb6wj31","country_code":"ES","type":"education","lineage":["https://openalex.org/I9617848"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Alberto Barr\u00f3n-Cede\u00f1o","raw_affiliation_strings":["Universitat Polit\u00e8cnica de Catalunya"],"affiliations":[{"raw_affiliation_string":"Universitat Polit\u00e8cnica de Catalunya","institution_ids":["https://openalex.org/I9617848"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012230079","display_name":"Marta Gatius Vila","orcid":"https://orcid.org/0000-0003-0456-7912"},"institutions":[{"id":"https://openalex.org/I71999127","display_name":"Universitat de Barcelona","ror":"https://ror.org/021018s57","country_code":"ES","type":"education","lineage":["https://openalex.org/I71999127"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Marta Vila","raw_affiliation_strings":["Universitat de Barcelona"],"affiliations":[{"raw_affiliation_string":"Universitat de Barcelona","institution_ids":["https://openalex.org/I71999127"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041689337","display_name":"M. Ant\u00f2nia Mart\u00ed","orcid":"https://orcid.org/0000-0002-8849-6826"},"institutions":[{"id":"https://openalex.org/I71999127","display_name":"Universitat de Barcelona","ror":"https://ror.org/021018s57","country_code":"ES","type":"education","lineage":["https://openalex.org/I71999127"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"M. Mart\u00ed","raw_affiliation_strings":["Universitat de Barcelona"],"affiliations":[{"raw_affiliation_string":"Universitat de Barcelona","institution_ids":["https://openalex.org/I71999127"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053947754","display_name":"Paolo Rosso","orcid":"https://orcid.org/0000-0002-8922-1242"},"institutions":[{"id":"https://openalex.org/I60053951","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859","country_code":"ES","type":"education","lineage":["https://openalex.org/I60053951"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Paolo Rosso","raw_affiliation_strings":["Universitat Polit\u00e8cnica de Val\u00e8ncia"],"affiliations":[{"raw_affiliation_string":"Universitat Polit\u00e8cnica de Val\u00e8ncia","institution_ids":["https://openalex.org/I60053951"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5067489760"],"corresponding_institution_ids":["https://openalex.org/I9617848"],"apc_list":null,"apc_paid":null,"fwci":22.8972,"has_fulltext":false,"cited_by_count":148,"citation_normalized_percentile":{"value":0.99475737,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"39","issue":"4","first_page":"917","last_page":"947"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11492","display_name":"Academic integrity and plagiarism","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/paraphrase","display_name":"Paraphrase","score":0.9955134987831116},{"id":"https://openalex.org/keywords/plagiarism-detection","display_name":"Plagiarism detection","score":0.9113909006118774},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6548647284507751},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.48635679483413696},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.4538196623325348},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43724897503852844},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.35960066318511963},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.12460982799530029}],"concepts":[{"id":"https://openalex.org/C2780922921","wikidata":"https://www.wikidata.org/wiki/Q255189","display_name":"Paraphrase","level":2,"score":0.9955134987831116},{"id":"https://openalex.org/C2780907237","wikidata":"https://www.wikidata.org/wiki/Q2986238","display_name":"Plagiarism detection","level":2,"score":0.9113909006118774},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6548647284507751},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.48635679483413696},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.4538196623325348},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43724897503852844},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.35960066318511963},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.12460982799530029}],"mesh":[],"locations_count":7,"locations":[{"id":"doi:10.1162/coli_a_00153","is_oa":false,"landing_page_url":"https://doi.org/10.1162/coli_a_00153","pdf_url":null,"source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},{"id":"pmh:oai:diposit.ub.edu:2445/49363","is_oa":false,"landing_page_url":"https://hdl.handle.net/2445/49363","pdf_url":null,"source":{"id":"https://openalex.org/S4306401653","display_name":"Dip\u00f2sit Digital de la Universitat de Barcelona (Universitat de Barcelona)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I71999127","host_organization_name":"Universitat de Barcelona","host_organization_lineage":["https://openalex.org/I71999127"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Articles publicats en revistes (Filologia Catalana i Ling\u00fc\u00edstica General)","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:upcommons.upc.edu:2117/20297","is_oa":true,"landing_page_url":"https://hdl.handle.net/2117/20297","pdf_url":null,"source":{"id":"https://openalex.org/S4210207057","display_name":"QRU Quaderns de Recerca en Urbanisme","issn_l":"2014-9689","issn":["2014-9689","2385-6777"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310322448","host_organization_name":"Q71272178","host_organization_lineage":["https://openalex.org/P4310322448"],"host_organization_lineage_names":["Q71272178"],"type":"journal"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:www.recercat.cat:2072/265377","is_oa":true,"landing_page_url":"http://hdl.handle.net/2445/49363","pdf_url":"http://hdl.handle.net/2445/49363","source":{"id":"https://openalex.org/S4306402147","display_name":"RECERCAT (Consorci de Serveis Universitaris de Catalunya)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210090028","host_organization_name":"Consorci de Serveis Universitaris de Catalunya","host_organization_lineage":["https://openalex.org/I4210090028"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:cris.unibo.it:11585/707696","is_oa":true,"landing_page_url":"http://hdl.handle.net/11585/707696","pdf_url":null,"source":{"id":"https://openalex.org/S4306402579","display_name":"Archivio istituzionale della ricerca (Alma Mater Studiorum Universit\u00e0 di Bologna)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210117483","host_organization_name":"Istituto di Ematologia di Bologna","host_organization_lineage":["https://openalex.org/I4210117483"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:doaj.org/article:f3c540636d2143368ac263a0ef3f47af","is_oa":true,"landing_page_url":"https://doaj.org/article/f3c540636d2143368ac263a0ef3f47af","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computational Linguistics, Vol 39, Iss 4 (2021)","raw_type":"article"},{"id":"pmh:oai:riunet.upv.es:10251/46317","is_oa":true,"landing_page_url":"http://hdl.handle.net/10251/46317","pdf_url":null,"source":{"id":"https://openalex.org/S4306401500","display_name":"RiuNet (Politechnical University of Valencia)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I60053951","host_organization_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","host_organization_lineage":["https://openalex.org/I60053951"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"pmh:oai:upcommons.upc.edu:2117/20297","is_oa":true,"landing_page_url":"https://hdl.handle.net/2117/20297","pdf_url":null,"source":{"id":"https://openalex.org/S4210207057","display_name":"QRU Quaderns de Recerca en Urbanisme","issn_l":"2014-9689","issn":["2014-9689","2385-6777"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310322448","host_organization_name":"Q71272178","host_organization_lineage":["https://openalex.org/P4310322448"],"host_organization_lineage_names":["Q71272178"],"type":"journal"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1974636337","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320321764","funder_display_name":"Ministerio de Educaci\u00f3n, Cultura y Deporte"},{"id":"https://openalex.org/G6199776388","display_name":null,"funder_award_id":"Spain","funder_id":"https://openalex.org/F4320321764","funder_display_name":"Ministerio de Educaci\u00f3n, Cultura y Deporte"},{"id":"https://openalex.org/G8589669012","display_name":null,"funder_award_id":"246016","funder_id":"https://openalex.org/F4320320885","funder_display_name":"European Research Consortium for Informatics and Mathematics"}],"funders":[{"id":"https://openalex.org/F4320320885","display_name":"European Research Consortium for Informatics and Mathematics","ror":"https://ror.org/055zrhj18"},{"id":"https://openalex.org/F4320321764","display_name":"Ministerio de Educaci\u00f3n, Cultura y Deporte","ror":"https://ror.org/03nc27g21"},{"id":"https://openalex.org/F4320322930","display_name":"Ministerio de Ciencia e Innovaci\u00f3n","ror":"https://ror.org/034900433"},{"id":"https://openalex.org/F4320334905","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W54772338","https://openalex.org/W65010961","https://openalex.org/W78382366","https://openalex.org/W86855850","https://openalex.org/W88290828","https://openalex.org/W118736248","https://openalex.org/W123495503","https://openalex.org/W131533222","https://openalex.org/W147342296","https://openalex.org/W169106424","https://openalex.org/W257731206","https://openalex.org/W366513329","https://openalex.org/W587539298","https://openalex.org/W1483700983","https://openalex.org/W1536675587","https://openalex.org/W1544505227","https://openalex.org/W1563364218","https://openalex.org/W1564629710","https://openalex.org/W1600505241","https://openalex.org/W1974336599","https://openalex.org/W1980849679","https://openalex.org/W1987244517","https://openalex.org/W1992387162","https://openalex.org/W2008127487","https://openalex.org/W2028776121","https://openalex.org/W2034916234","https://openalex.org/W2039217078","https://openalex.org/W2065658084","https://openalex.org/W2069985874","https://openalex.org/W2091494174","https://openalex.org/W2101222922","https://openalex.org/W2107130271","https://openalex.org/W2118733980","https://openalex.org/W2123596227","https://openalex.org/W2124874361","https://openalex.org/W2127218421","https://openalex.org/W2129468719","https://openalex.org/W2129554311","https://openalex.org/W2134168908","https://openalex.org/W2138613338","https://openalex.org/W2149182189","https://openalex.org/W2169813772","https://openalex.org/W2171060541","https://openalex.org/W2237102846","https://openalex.org/W2280333896","https://openalex.org/W2284824783","https://openalex.org/W2299467264","https://openalex.org/W2340746501","https://openalex.org/W2596004617","https://openalex.org/W2605134814","https://openalex.org/W2607879133","https://openalex.org/W2892737606","https://openalex.org/W2905907858","https://openalex.org/W2978104984","https://openalex.org/W4229781645","https://openalex.org/W4230735677","https://openalex.org/W4237719669","https://openalex.org/W4292003697"],"related_works":["https://openalex.org/W3195775898","https://openalex.org/W4287024084","https://openalex.org/W2147528976","https://openalex.org/W2982625988","https://openalex.org/W4295159264","https://openalex.org/W2775899031","https://openalex.org/W2324328502","https://openalex.org/W2978707643","https://openalex.org/W4378713476","https://openalex.org/W4248451614"],"abstract_inverted_index":{"Although":[0],"paraphrasing":[1,46],"is":[2],"the":[3,19,43,77,93,103,113,144,148,159,163,166,178],"linguistic":[4],"mechanism":[5],"underlying":[6],"many":[7],"plagiarism":[8,23,27,59,67,98,136,170,182],"cases,":[9],"little":[10],"attention":[11,51],"has":[12],"been":[13,172],"paid":[14],"to":[15,32,52,88,157],"its":[16],"analysis":[17],"in":[18,73,112],"framework":[20],"of":[21,35,58,62,92,102,115,132,180],"automatic":[22,97,181],"detection.":[24,99],"Therefore,":[25],"state-of-the-art":[26],"detectors":[28],"find":[29],"it":[30],"difficult":[31],"detect":[33],"cases":[34],"paraphrase":[36,54,86,126,133,145,154,167],"plagiarism.":[37],"In":[38],"this":[39,71,116],"article,":[40],"we":[41,75],"analyze":[42],"relationship":[44],"between":[45],"and":[47,60,128,152],"plagiarism,":[48],"paying":[49],"special":[50],"which":[53,61],"phenomena":[55,127],"underlie":[56],"acts":[57],"them":[63],"are":[64,143],"detected":[65],"by":[66],"detection":[68,137,183],"systems.":[69,184],"With":[70],"aim":[72],"mind,":[74],"created":[76],"P4P":[78],"corpus,":[79],"a":[80,85,90,129],"new":[81],"resource":[82],"that":[83,122],"uses":[84],"typology":[87],"annotate":[89],"subset":[91],"PAN-PC-10":[94],"corpus":[95],"for":[96,177],"The":[100,118],"results":[101],"Second":[104],"International":[105],"Competition":[106],"on":[107],"Plagiarism":[108],"Detection":[109],"were":[110],"analyzed":[111],"light":[114],"annotation.":[117],"presented":[119],"experiments":[120],"show":[121],"(i)":[123],"more":[124,138],"complex":[125],"high":[130],"density":[131],"mechanisms":[134,146,155,168],"make":[135],"difficult,":[139],"(ii)":[140],"lexical":[141],"substitutions":[142],"used":[147],"most":[149],"when":[150],"plagiarizing,":[151],"(iii)":[153],"tend":[156],"shorten":[158],"plagiarized":[160],"text.":[161],"For":[162],"first":[164],"time,":[165],"behind":[169],"have":[171],"analyzed,":[173],"providing":[174],"critical":[175],"insights":[176],"improvement":[179]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":27},{"year":2018,"cited_by_count":16},{"year":2017,"cited_by_count":16},{"year":2016,"cited_by_count":15},{"year":2015,"cited_by_count":20},{"year":2014,"cited_by_count":6},{"year":2013,"cited_by_count":5}],"updated_date":"2026-03-17T17:19:04.345684","created_date":"2016-06-24T00:00:00"}
