{"id":"https://openalex.org/W1494542529","doi":"https://doi.org/10.1007/978-3-642-16761-4_3","title":"Towards Document Plagiarism Detection Based on the Relevance and Fragmentation of the Reused Text","display_name":"Towards Document Plagiarism Detection Based on the Relevance and Fragmentation of the Reused Text","publication_year":2010,"publication_date":"2010-01-01","ids":{"openalex":"https://openalex.org/W1494542529","doi":"https://doi.org/10.1007/978-3-642-16761-4_3","mag":"1494542529"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-642-16761-4_3","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-642-16761-4_3","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055252239","display_name":"Fernando S\u00e1nchez-Vega","orcid":"https://orcid.org/0000-0002-8533-2818"},"institutions":[{"id":"https://openalex.org/I39824353","display_name":"National Institute of Astrophysics, Optics and Electronics","ror":"https://ror.org/00bpmmc63","country_code":"MX","type":"facility","lineage":["https://openalex.org/I39824353"]}],"countries":["MX"],"is_corresponding":true,"raw_author_name":"Fernando S\u00e1nchez-Vega","raw_affiliation_strings":["Laboratory of Language Technologies, Department of Computational Sciences, National Institute of Astrophysics, Optics and Electronics (INAOE), Mexico"],"affiliations":[{"raw_affiliation_string":"Laboratory of Language Technologies, Department of Computational Sciences, National Institute of Astrophysics, Optics and Electronics (INAOE), Mexico","institution_ids":["https://openalex.org/I39824353"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053929522","display_name":"Luis Villase\u00f1or-Pineda","orcid":"https://orcid.org/0000-0003-1294-9128"},"institutions":[{"id":"https://openalex.org/I39824353","display_name":"National Institute of Astrophysics, Optics and Electronics","ror":"https://ror.org/00bpmmc63","country_code":"MX","type":"facility","lineage":["https://openalex.org/I39824353"]}],"countries":["MX"],"is_corresponding":false,"raw_author_name":"Luis Villase\u00f1or-Pineda","raw_affiliation_strings":["Laboratory of Language Technologies, Department of Computational Sciences, National Institute of Astrophysics, Optics and Electronics (INAOE), Mexico"],"affiliations":[{"raw_affiliation_string":"Laboratory of Language Technologies, Department of Computational Sciences, National Institute of Astrophysics, Optics and Electronics (INAOE), Mexico","institution_ids":["https://openalex.org/I39824353"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050780136","display_name":"Manuel Montes-y-G\u00f3mez","orcid":"https://orcid.org/0000-0002-7601-501X"},"institutions":[{"id":"https://openalex.org/I17301866","display_name":"University of Alabama","ror":"https://ror.org/03xrrjk67","country_code":"US","type":"education","lineage":["https://openalex.org/I17301866"]},{"id":"https://openalex.org/I39824353","display_name":"National Institute of Astrophysics, Optics and Electronics","ror":"https://ror.org/00bpmmc63","country_code":"MX","type":"facility","lineage":["https://openalex.org/I39824353"]}],"countries":["MX","US"],"is_corresponding":false,"raw_author_name":"Manuel Montes-y-G\u00f3mez","raw_affiliation_strings":["Department of Computer and Information Sciences, University of Alabama, Birmingham, Mexico","Laboratory of Language Technologies, Department of Computational Sciences, National Institute of Astrophysics, Optics and Electronics (INAOE), Mexico"],"affiliations":[{"raw_affiliation_string":"Department of Computer and Information Sciences, University of Alabama, Birmingham, Mexico","institution_ids":["https://openalex.org/I17301866"]},{"raw_affiliation_string":"Laboratory of Language Technologies, Department of Computational Sciences, National Institute of Astrophysics, Optics and Electronics (INAOE), Mexico","institution_ids":["https://openalex.org/I39824353"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053947754","display_name":"Paolo Rosso","orcid":"https://orcid.org/0000-0002-8922-1242"},"institutions":[{"id":"https://openalex.org/I60053951","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859","country_code":"ES","type":"education","lineage":["https://openalex.org/I60053951"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Paolo Rosso","raw_affiliation_strings":["Natural Language Engineering Lab, ELiRF, DSIC, Universidad Polit\u00e9cnica de Valencia, Spain"],"affiliations":[{"raw_affiliation_string":"Natural Language Engineering Lab, ELiRF, DSIC, Universidad Polit\u00e9cnica de Valencia, Spain","institution_ids":["https://openalex.org/I60053951"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5055252239"],"corresponding_institution_ids":["https://openalex.org/I39824353"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":1.4161,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.81481198,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"24","last_page":"31"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11492","display_name":"Academic integrity and plagiarism","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/plagiarism-detection","display_name":"Plagiarism detection","score":0.8431394696235657},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7417284250259399},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.6337317228317261},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5467913150787354},{"id":"https://openalex.org/keywords/fragmentation","display_name":"Fragmentation (computing)","score":0.5138716697692871},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.44388478994369507},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.44020673632621765},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4349970519542694},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.41998058557510376},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37207821011543274},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10666003823280334},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.0672808289527893}],"concepts":[{"id":"https://openalex.org/C2780907237","wikidata":"https://www.wikidata.org/wiki/Q2986238","display_name":"Plagiarism detection","level":2,"score":0.8431394696235657},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7417284250259399},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.6337317228317261},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5467913150787354},{"id":"https://openalex.org/C191015642","wikidata":"https://www.wikidata.org/wiki/Q1132459","display_name":"Fragmentation (computing)","level":2,"score":0.5138716697692871},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.44388478994369507},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.44020673632621765},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4349970519542694},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41998058557510376},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37207821011543274},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10666003823280334},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0672808289527893},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/978-3-642-16761-4_3","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-642-16761-4_3","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.386.3853","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.386.3853","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://ccc.inaoep.mx/~mmontesg/publicaciones/2010/PlagarishmDetection-MICAI10.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1555414055","https://openalex.org/W1570448133","https://openalex.org/W1589844230","https://openalex.org/W1967043694","https://openalex.org/W1974336599","https://openalex.org/W2118020653","https://openalex.org/W2149182189","https://openalex.org/W2297579780","https://openalex.org/W2335634178","https://openalex.org/W2339626475","https://openalex.org/W2340746501","https://openalex.org/W2603144157","https://openalex.org/W2905907858","https://openalex.org/W2966207845"],"related_works":["https://openalex.org/W4287126803","https://openalex.org/W3168266056","https://openalex.org/W4250737080","https://openalex.org/W2112890327","https://openalex.org/W2735162248","https://openalex.org/W311440260","https://openalex.org/W2945111072","https://openalex.org/W1496191935","https://openalex.org/W2132239106","https://openalex.org/W3080940603"],"abstract_inverted_index":null,"counts_by_year":[{"year":2015,"cited_by_count":1},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
