{"id":"https://openalex.org/W4407218606","doi":"https://doi.org/10.1186/s40537-025-01082-0","title":"Comparison of algorithms for the recognition of ChatGPT paraphrased texts","display_name":"Comparison of algorithms for the recognition of ChatGPT paraphrased texts","publication_year":2025,"publication_date":"2025-02-06","ids":{"openalex":"https://openalex.org/W4407218606","doi":"https://doi.org/10.1186/s40537-025-01082-0"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-025-01082-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01082-0","pdf_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01082-0.pdf","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01082-0.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083774363","display_name":"Aleksandar Kartelj","orcid":"https://orcid.org/0000-0001-9839-6039"},"institutions":[{"id":"https://openalex.org/I4068193","display_name":"University of Belgrade","ror":"https://ror.org/02qsmb048","country_code":"RS","type":"education","lineage":["https://openalex.org/I4068193"]}],"countries":["RS"],"is_corresponding":true,"raw_author_name":"Aleksandar Kartelj","raw_affiliation_strings":["Faculty of Mathematics, University of Belgrade, Studentski trg 16, Belgrade, 11000, Serbia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Mathematics, University of Belgrade, Studentski trg 16, Belgrade, 11000, Serbia","institution_ids":["https://openalex.org/I4068193"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102874859","display_name":"Miljana Mladenovi\u0107","orcid":"https://orcid.org/0000-0002-7973-452X"},"institutions":[{"id":"https://openalex.org/I152518017","display_name":"University of Nis","ror":"https://ror.org/00965bg92","country_code":"RS","type":"education","lineage":["https://openalex.org/I152518017"]}],"countries":["RS"],"is_corresponding":false,"raw_author_name":"Miljana Mladenovi\u0107","raw_affiliation_strings":["Faculty of Education, University of Ni\u0161, Partizanska 14, Vranje, 17500, Serbia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Education, University of Ni\u0161, Partizanska 14, Vranje, 17500, Serbia","institution_ids":["https://openalex.org/I152518017"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023658721","display_name":"Sta\u0161a Vuji\u010di\u0107 Stankovi\u0107","orcid":"https://orcid.org/0000-0002-7200-3724"},"institutions":[{"id":"https://openalex.org/I4068193","display_name":"University of Belgrade","ror":"https://ror.org/02qsmb048","country_code":"RS","type":"education","lineage":["https://openalex.org/I4068193"]}],"countries":["RS"],"is_corresponding":false,"raw_author_name":"Sta\u0161a Vuji\u010di\u0107 Stankovi\u0107","raw_affiliation_strings":["Faculty of Mathematics, University of Belgrade, Studentski trg 16, Belgrade, 11000, Serbia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Mathematics, University of Belgrade, Studentski trg 16, Belgrade, 11000, Serbia","institution_ids":["https://openalex.org/I4068193"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5083774363"],"corresponding_institution_ids":["https://openalex.org/I4068193"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":10.7687,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.97705018,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"12","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9639000296592712,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9484999775886536,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8071998357772827},{"id":"https://openalex.org/keywords/computational-science-and-engineering","display_name":"Computational Science and Engineering","score":0.6030767560005188},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3891470432281494},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3735015392303467},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.35953080654144287},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.33567488193511963},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3312857747077942},{"id":"https://openalex.org/keywords/mathematics-education","display_name":"Mathematics education","score":0.3219642639160156},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.26172637939453125},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11917668581008911}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8071998357772827},{"id":"https://openalex.org/C68597687","wikidata":"https://www.wikidata.org/wiki/Q362601","display_name":"Computational Science and Engineering","level":2,"score":0.6030767560005188},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3891470432281494},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3735015392303467},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.35953080654144287},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.33567488193511963},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3312857747077942},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.3219642639160156},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.26172637939453125},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11917668581008911}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s40537-025-01082-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01082-0","pdf_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01082-0.pdf","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:e41fa5df348c41b7aa9df76d9db53dc1","is_oa":true,"landing_page_url":"https://doaj.org/article/e41fa5df348c41b7aa9df76d9db53dc1","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Big Data, Vol 12, Iss 1, Pp 1-17 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-025-01082-0","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-025-01082-0","pdf_url":"https://link.springer.com/content/pdf/10.1186/s40537-025-01082-0.pdf","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4407218606.pdf"},"referenced_works_count":6,"referenced_works":["https://openalex.org/W2585196369","https://openalex.org/W4311641658","https://openalex.org/W4386317922","https://openalex.org/W4388410460","https://openalex.org/W4390175962","https://openalex.org/W4391816278"],"related_works":["https://openalex.org/W2051487156","https://openalex.org/W2073681303","https://openalex.org/W4393232657","https://openalex.org/W2053286651","https://openalex.org/W4390638272","https://openalex.org/W2181743346","https://openalex.org/W2187401768","https://openalex.org/W2181413294","https://openalex.org/W2989452537","https://openalex.org/W2052122378"],"abstract_inverted_index":{"Abstract":[0],"The":[1,133],"rapid":[2],"development":[3],"of":[4,15,67,69,90,124,148,166,172,184,195,203,214,218,227,236],"artificial":[5],"intelligence,":[6],"especially":[7,35],"AI":[8],"assistants,":[9],"is":[10],"leading":[11],"to":[12,20,48,80,86,121,141,255,296],"new":[13,64],"forms":[14],"plagiarism":[16,51],"that":[17,178,201,224],"are":[18,191,210],"difficult":[19],"detect":[21,50],"using":[22],"existing":[23],"methods.":[24],"Paraphrasing":[25],"tools":[26,277],"make":[27],"this":[28],"problem":[29],"even":[30],"more":[31],"complex":[32],"and":[33,42,56,74,93,113,189,208,238,243,285,300],"challenging":[34],"in":[36,72,179,193,212,240,247,260,275,283],"minor":[37,261,290],"languages":[38,262,291],"with":[39,292],"inadequate":[40],"resources":[41],"tools.":[43,60],"This":[44],"study":[45],"explores":[46],"strategies":[47],"help":[49],"generated":[52],"by":[53,58],"ChatGPT":[54,81,129],"4.0":[55],"altered":[57],"paraphrasing":[59,258],"We":[61,97,250],"propose":[62],"two":[63,88,108],"datasets":[65,77,175,221],"consisting":[66],"abstracts":[68],"doctoral":[70],"theses":[71],"English":[73,137,198,241],"Serbian.":[75,265],"Both":[76],"were":[78,160],"subjected":[79],"paraphrasing,":[82],"which":[83],"allowed":[84],"us":[85],"form":[87],"classes":[89],"texts:":[91],"human-written":[92],"AI-generated,":[94],"i.e.,":[95],"AI-paraphrased.":[96],"then":[98],"comprehensively":[99],"compare":[100,119],"19":[101],"widely":[102],"used":[103],"classification":[104],"algorithms":[105],"based":[106],"on":[107,135,156],"feature":[109],"sets:":[110],"word":[111],"unigrams":[112],"character":[114],"multigrams.":[115],"In":[116,152],"addition,":[117],"we":[118],"these":[120,253],"the":[122,136,154,157,173,187,206,219,225,228,269],"results":[123,134,155],"a":[125],"commercially":[126],"available":[127],"pre-trained":[128],"content":[130,298],"detector,":[131],"ZeroGPT.":[132],"corpus":[138,159],"turn":[139],"out":[140],"be":[142],"very":[143],"accurate,":[144,162],"achieving":[145,163],"an":[146,164],"accuracy":[147,165],"95%":[149],"or":[150,245],"more.":[151],"contrast,":[153],"Serbian":[158,180,248],"less":[161],"just":[167],"over":[168],"85%.":[169],"Syntax":[170,216],"analysis":[171,217],"training":[174],"has":[176,222],"shown":[177,223],"GPT-paraphrased":[181,197],"texts,":[182],"33.2%":[183],"sentences":[185,204],"remain":[186,205],"same,":[188,207],"they":[190,209],"found":[192,211],"63%":[194],"documents.":[196,215],"texts":[199,242,282],"showed":[200],"3.2%":[202],"16%":[213],"test":[220],"change":[226],"model":[229],"temperature":[230],"influences":[231],"syntactic":[232],"features":[233],"(average":[234],"number":[235],"words":[237],"sentences)":[239],"slightly":[244],"not":[246],"texts.":[249],"attribute":[251],"all":[252],"differences":[254],"GPT\u2019s":[256],"lower":[257],"ability":[259],"such":[263],"as":[264],"Presented":[266],"findings":[267],"underscore":[268],"necessity":[270],"for":[271,279,289],"making":[272],"persistent":[273],"effort":[274],"developing":[276],"made":[278],"detecting":[280],"AI-paraphrased":[281],"academic":[284],"professional":[286],"settings,":[287],"particularly":[288],"limited":[293],"NLP":[294],"resources,":[295],"preserve":[297],"integrity":[299],"authenticity.":[301]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4}],"updated_date":"2026-04-26T08:31:28.666265","created_date":"2025-10-10T00:00:00"}
