{"id":"https://openalex.org/W7134041084","doi":"https://doi.org/10.48550/arxiv.2603.05345","title":"A Multilingual Human Annotated Corpus of Original and Easy-to-Read Texts to Support Access to Democratic Participatory Processes","display_name":"A Multilingual Human Annotated Corpus of Original and Easy-to-Read Texts to Support Access to Democratic Participatory Processes","publication_year":2026,"publication_date":"2026-03-05","ids":{"openalex":"https://openalex.org/W7134041084","doi":"https://doi.org/10.48550/arxiv.2603.05345"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.05345","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051720921","display_name":"Stefan Bott","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bott, Stefan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128227429","display_name":"Verena Riegler","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Riegler, Verena","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128249542","display_name":"Horacio Saggion","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saggion, Horacio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121821050","display_name":"Almudena Rasc\u00f3n Alcaina","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alcaina, Almudena Rasc\u00f3n","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128232186","display_name":"Nouran Khallaf","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khallaf, Nouran","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12478","display_name":"Wikis in Education and Collaboration","score":0.00039999998989515007,"subfield":{"id":"https://openalex.org/subfields/3315","display_name":"Communication"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.0003000000142492354,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/catalan","display_name":"Catalan","score":0.7031000256538391},{"id":"https://openalex.org/keywords/corpus-linguistics","display_name":"Corpus linguistics","score":0.5967000126838684},{"id":"https://openalex.org/keywords/citizen-journalism","display_name":"Citizen journalism","score":0.46619999408721924},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4424000084400177},{"id":"https://openalex.org/keywords/democracy","display_name":"Democracy","score":0.415800005197525},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4072999954223633}],"concepts":[{"id":"https://openalex.org/C164105321","wikidata":"https://www.wikidata.org/wiki/Q7026","display_name":"Catalan","level":2,"score":0.7031000256538391},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6883000135421753},{"id":"https://openalex.org/C532629269","wikidata":"https://www.wikidata.org/wiki/Q865083","display_name":"Corpus linguistics","level":2,"score":0.5967000126838684},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.510200023651123},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49709999561309814},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.4853000044822693},{"id":"https://openalex.org/C203663800","wikidata":"https://www.wikidata.org/wiki/Q848979","display_name":"Citizen journalism","level":2,"score":0.46619999408721924},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4424000084400177},{"id":"https://openalex.org/C555826173","wikidata":"https://www.wikidata.org/wiki/Q7174","display_name":"Democracy","level":3,"score":0.415800005197525},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4072999954223633},{"id":"https://openalex.org/C2474386","wikidata":"https://www.wikidata.org/wiki/Q461183","display_name":"Text corpus","level":2,"score":0.36329999566078186},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2980000078678131},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.2808000147342682},{"id":"https://openalex.org/C94922259","wikidata":"https://www.wikidata.org/wiki/Q33215","display_name":"Constructed language","level":2,"score":0.2736999988555908},{"id":"https://openalex.org/C2993724205","wikidata":"https://www.wikidata.org/wiki/Q315","display_name":"Human language","level":2,"score":0.26350000500679016}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.05345","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.05345","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.05345","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.05345","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Being":[0],"able":[1],"to":[2,68,101,120,142,193],"understand":[3],"information":[4],"is":[5,16,31,50,147],"a":[6,10,74,167],"key":[7],"factor":[8],"for":[9,20,41,52,57,79,109,160,170],"self-determined":[11],"life":[12],"and":[13,44,64,135,172],"society.":[14],"It":[15,94,164],"also":[17,165],"very":[18],"important":[19],"participating":[21],"in":[22,91,183],"democratic":[23,110],"processes.":[24],"The":[25,112,123,145,186],"study":[26],"of":[27,37,76,105,157],"automatic":[28,47],"text":[29,92,127],"simplification":[30,86],"often":[32],"limited":[33],"by":[34,88],"the":[35,42,98,103,153,161,194],"availability":[36],"high":[38,84],"quality":[39,85],"material":[40],"training":[43],"evaluation":[45],"on":[46,131],"simplifiers.":[48],"This":[49],"true":[51],"English,":[53],"but":[54],"more":[55],"so":[56],"less":[58],"resourced":[59],"languages":[60],"like":[61],"Spanish,":[62],"Catalan":[63,162],"Italian.":[65],"In":[66],"order":[67],"fill":[69],"this":[70,121],"gap,":[71],"we":[72],"present":[73],"corpus":[75,124,146,156,187],"original":[77,113],"texts":[78,114,139],"these":[80,184],"3":[81],"languages,":[82],"with":[83],"produced":[87],"human":[89],"experts":[90],"simplification.":[93],"was":[95],"developed":[96],"within":[97],"iDEM":[99],"project":[100],"assess":[102],"impact":[104],"Easy-to-Read":[106],"(E2R)":[107],"language":[108,177],"participation.":[111],"were":[115,140],"compiled":[116],"from":[117],"domains":[118],"related":[119],"topic.":[122],"includes":[125,152],"different":[126],"types,":[128],"selected":[129],"based":[130],"relevance,":[132],"copyright":[133],"availability,":[134],"ethical":[136],"standards.":[137],"All":[138],"simplified":[141],"E2R":[143],"level.":[144],"particularity":[148],"valuable":[149],"because":[150],"it":[151],"first":[154],"annotated":[155],"its":[158],"kind":[159],"language.":[163],"represents":[166],"noteworthy":[168],"contribution":[169],"Spanish":[171],"Italian,":[173],"offering":[174],"high-quality,":[175],"human-annotated":[176],"resources":[178],"that":[179],"are":[180],"rarely":[181],"available":[182],"domains.":[185],"will":[188],"be":[189],"made":[190],"freely":[191],"accessible":[192],"public.":[195]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-07T00:00:00"}
