{"id":"https://openalex.org/W4393515868","doi":"https://doi.org/10.5281/zenodo.4639616","title":"CLiPS Stylometry Investigation (CSI) Corpus","display_name":"CLiPS Stylometry Investigation (CSI) Corpus","publication_year":2015,"publication_date":"2015-10-01","ids":{"openalex":"https://openalex.org/W4393515868","doi":"https://doi.org/10.5281/zenodo.4639616"},"language":"en","primary_location":{"id":"pmh:oai:zenodo.org:4639616","is_oa":true,"landing_page_url":"https://zenodo.org/record/4639616","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/other"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://zenodo.org/record/4639616","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012428119","display_name":"Ben Verhoeven","orcid":"https://orcid.org/0000-0003-0320-8256"},"institutions":[{"id":"https://openalex.org/I149213910","display_name":"University of Antwerp","ror":"https://ror.org/008x57b05","country_code":"BE","type":"education","lineage":["https://openalex.org/I149213910"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Verhoeven, Ben","raw_affiliation_strings":["CLiPS Research Center, University of Antwerp"],"raw_orcid":"https://orcid.org/0000-0003-0320-8256","affiliations":[{"raw_affiliation_string":"CLiPS Research Center, University of Antwerp","institution_ids":["https://openalex.org/I149213910"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083411784","display_name":"Walter Daelemans","orcid":"https://orcid.org/0000-0002-9832-7890"},"institutions":[{"id":"https://openalex.org/I149213910","display_name":"University of Antwerp","ror":"https://ror.org/008x57b05","country_code":"BE","type":"education","lineage":["https://openalex.org/I149213910"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Daelemans, Walter","raw_affiliation_strings":["CLiPS Research Center, University of Antwerp"],"raw_orcid":"https://orcid.org/0000-0002-9832-7890","affiliations":[{"raw_affiliation_string":"CLiPS Research Center, University of Antwerp","institution_ids":["https://openalex.org/I149213910"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5012428119"],"corresponding_institution_ids":["https://openalex.org/I149213910"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.4805000126361847,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.4805000126361847,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stylometry","display_name":"Stylometry","score":0.9047592282295227},{"id":"https://openalex.org/keywords/clips","display_name":"CLIPS","score":0.8016058206558228},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.44588035345077515},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.441297709941864},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32284343242645264}],"concepts":[{"id":"https://openalex.org/C11192451","wikidata":"https://www.wikidata.org/wiki/Q2032038","display_name":"Stylometry","level":2,"score":0.9047592282295227},{"id":"https://openalex.org/C2778739407","wikidata":"https://www.wikidata.org/wiki/Q165372","display_name":"CLIPS","level":2,"score":0.8016058206558228},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.44588035345077515},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.441297709941864},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32284343242645264}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:zenodo.org:4639616","is_oa":true,"landing_page_url":"https://zenodo.org/record/4639616","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/other"},{"id":"doi:10.5281/zenodo.4639616","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.4639616","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"pmh:oai:zenodo.org:4639616","is_oa":true,"landing_page_url":"https://zenodo.org/record/4639616","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/other"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2417253731","https://openalex.org/W2350469024","https://openalex.org/W2491583298","https://openalex.org/W2036154621","https://openalex.org/W2327827625","https://openalex.org/W2395860100","https://openalex.org/W795077857","https://openalex.org/W2376416463","https://openalex.org/W3204019825"],"abstract_inverted_index":{"The":[0,17,62],"CSI":[1],"corpus":[2,7,21,67,77],"is":[3,33],"a":[4,34],"yearly":[5],"expanded":[6],"of":[8,19,37,49,65,75],"student":[9],"texts":[10],"in":[11,24,70],"two":[12],"genres:":[13],"essays":[14],"and":[15,53],"reviews.":[16],"purpose":[18],"this":[20],"lies":[22],"primarily":[23],"stylometric":[25],"research,":[26],"but":[27],"other":[28],"applications":[29],"are":[30,78],"possible.":[31],"There":[32],"vast":[35],"amount":[36],"meta-data":[38],"available,":[39],"both":[40],"on":[41,54],"the":[42,55,66,76,81],"author":[43],"(gender,":[44],"age,":[45],"sexual":[46],"orientation,":[47],"region":[48],"origin,":[50],"personality":[51],"profile)":[52],"document":[56],"(timestamp,":[57],"genre,":[58],"veracity,":[59],"sentiment,":[60],"grade).":[61],"current":[63],"version":[64],"was":[68],"assembled":[69],"February":[71],"2016.":[72],"Previous":[73],"versions":[74],"available":[79],"from":[80],"authors":[82],"via":[83],"e-mail":[84],"request.":[85]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
