{"id":"https://openalex.org/W7140137853","doi":"https://doi.org/10.18653/v1/2026.eacl-demo.6","title":"DELTA: A Toolkit for Measuring Linguistic Diversity in Dependency-Parsed Corpora","display_name":"DELTA: A Toolkit for Measuring Linguistic Diversity in Dependency-Parsed Corpora","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7140137853","doi":"https://doi.org/10.18653/v1/2026.eacl-demo.6"},"language":null,"primary_location":{"id":"doi:10.18653/v1/2026.eacl-demo.6","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2026.eacl-demo.6","pdf_url":"https://aclanthology.org/2026.eacl-demo.6.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th Conference of the European Chapter of the Association for Computational Linguistics (Volume 3: System Demonstrations)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2026.eacl-demo.6.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101230899","display_name":"Louis Est\u00e8ve","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Louis Est\u00e8ve","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130341945","display_name":"Kaja Dobrovoljc","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kaja Dobrovoljc","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.4009097,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"75","last_page":"85"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.6243000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.6243000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.0632999986410141,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.03700000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/diversity","display_name":"Diversity (politics)","score":0.3750999867916107},{"id":"https://openalex.org/keywords/linguistic-diversity","display_name":"Linguistic diversity","score":0.3312000036239624},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.299699991941452},{"id":"https://openalex.org/keywords/computational-linguistics","display_name":"Computational linguistics","score":0.28929999470710754},{"id":"https://openalex.org/keywords/corpus-linguistics","display_name":"Corpus linguistics","score":0.2833000123500824}],"concepts":[{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.614799976348877},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.588100016117096},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5006999969482422},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4336000084877014},{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.3750999867916107},{"id":"https://openalex.org/C2992249680","wikidata":"https://www.wikidata.org/wiki/Q315","display_name":"Linguistic diversity","level":2,"score":0.3312000036239624},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.299699991941452},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.28929999470710754},{"id":"https://openalex.org/C532629269","wikidata":"https://www.wikidata.org/wiki/Q865083","display_name":"Corpus linguistics","level":2,"score":0.2833000123500824},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.2671999931335449}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2026.eacl-demo.6","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2026.eacl-demo.6","pdf_url":"https://aclanthology.org/2026.eacl-demo.6.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th Conference of the European Chapter of the Association for Computational Linguistics (Volume 3: System Demonstrations)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2026.eacl-demo.6","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2026.eacl-demo.6","pdf_url":"https://aclanthology.org/2026.eacl-demo.6.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th Conference of the European Chapter of the Association for Computational Linguistics (Volume 3: System Demonstrations)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.5039202570915222}],"awards":[{"id":"https://openalex.org/G7554473891","display_name":"SEmantic LEXicon INduction for Interpretability and diversity in text processing","funder_award_id":"ANR-21-CE23-0033","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"}],"funders":[{"id":"https://openalex.org/F4320320883","display_name":"Agence Nationale de la Recherche","ror":"https://ror.org/00rbzpz17"},{"id":"https://openalex.org/F4320324252","display_name":"Universit\u00e9 Paris-Saclay","ror":"https://ror.org/03xjwb503"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7140137853.pdf","grobid_xml":"https://content.openalex.org/works/W7140137853.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Despite":[0],"growing":[1],"interest":[2],"in":[3],"measuring":[4,26],"linguistic":[5,31,60],"diversity":[6,28,53,68,110],"on":[7,20,33,96],"the":[8,12,21,27,82],"one":[9],"hand":[10],"and":[11,66,108],"increasing":[13],"availability":[14],"of":[15,29,90],"cross-linguistically":[16],"comparable":[17],"parsed":[18],"corpora":[19,77],"other,":[22],"tools":[23],"for":[24,105],"systematically":[25],"specific":[30,91],"phenomena":[32],"such":[34],"data":[35],"remain":[36],"limited.To":[37],"address":[38],"this":[39],"gap,":[40],"we":[41],"present":[42],"DELTA,":[43],"an":[44],"open-source":[45],"framework":[46],"that":[47],"integrates":[48],"dependency":[49],"tree":[50],"querying":[51],"with":[52],"computation,":[54],"enabling":[55],"systematic":[56],"measurement":[57],"across":[58],"multiple":[59,67],"levels":[61],"(e.g.,":[62],"lexis,":[63],"morphology,":[64],"syntax)":[65],"dimensions":[69],"(variety,":[70],"balance,":[71],"disparity).The":[72],"pipeline":[73],"processes":[74],"CoNLL-U":[75],"formatted":[76],"through":[78],"configurable":[79],"workflows,":[80],"treating":[81],"format":[83],"as":[84],"a":[85],"general-purpose":[86],"tabular":[87],"structure":[88],"independent":[89],"annotation":[92],"conventions.We":[93],"validate":[94],"DELTA":[95],"Parallel":[97],"Universal":[98],"Dependencies":[99],"multilingual":[100],"dataset,":[101],"demonstrating":[102],"its":[103],"capacity":[104],"corpus":[106],"profiling":[107],"cross-corpus":[109],"comparison.":[111]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-24T00:00:00"}
