{"id":"https://openalex.org/W2944226280","doi":"https://doi.org/10.1017/s1351324919000056","title":"Annotating a broad range of anaphoric phenomena, in a variety of genres: the ARRAU Corpus","display_name":"Annotating a broad range of anaphoric phenomena, in a variety of genres: the ARRAU Corpus","publication_year":2019,"publication_date":"2019-05-07","ids":{"openalex":"https://openalex.org/W2944226280","doi":"https://doi.org/10.1017/s1351324919000056","mag":"2944226280"},"language":"en","primary_location":{"id":"doi:10.1017/s1351324919000056","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324919000056","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011044971","display_name":"Olga Uryupina","orcid":"https://orcid.org/0000-0003-0504-2827"},"institutions":[{"id":"https://openalex.org/I193223587","display_name":"University of Trento","ror":"https://ror.org/05trd4x28","country_code":"IT","type":"education","lineage":["https://openalex.org/I193223587"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Olga Uryupina","raw_affiliation_strings":["Department of Information Engineering and Computer Science, University of Trento"],"affiliations":[{"raw_affiliation_string":"Department of Information Engineering and Computer Science, University of Trento","institution_ids":["https://openalex.org/I193223587"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051313364","display_name":"Ron Artstein","orcid":"https://orcid.org/0009-0005-5187-6381"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]},{"id":"https://openalex.org/I4210087747","display_name":"Creative Technologies (United States)","ror":"https://ror.org/001qkb777","country_code":"US","type":"company","lineage":["https://openalex.org/I4210087747"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ron Artstein","raw_affiliation_strings":["Institute for Creative Technologies, University of Southern California"],"affiliations":[{"raw_affiliation_string":"Institute for Creative Technologies, University of Southern California","institution_ids":["https://openalex.org/I4210087747","https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017580022","display_name":"Antonella Bristot","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Antonella Bristot","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079503351","display_name":"Federica Cavicchio","orcid":"https://orcid.org/0000-0002-2795-8396"},"institutions":[{"id":"https://openalex.org/I91203450","display_name":"University of Haifa","ror":"https://ror.org/02f009v59","country_code":"IL","type":"education","lineage":["https://openalex.org/I91203450"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Federica Cavicchio","raw_affiliation_strings":["Sign Language Lab, University of Haifa"],"affiliations":[{"raw_affiliation_string":"Sign Language Lab, University of Haifa","institution_ids":["https://openalex.org/I91203450"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014332510","display_name":"Francesca Delogu","orcid":"https://orcid.org/0000-0002-8158-126X"},"institutions":[{"id":"https://openalex.org/I91712215","display_name":"Saarland University","ror":"https://ror.org/01jdpyv68","country_code":"DE","type":"education","lineage":["https://openalex.org/I91712215"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Francesca Delogu","raw_affiliation_strings":["Department of Computational Linguistics & Phonetics, Saarland University"],"affiliations":[{"raw_affiliation_string":"Department of Computational Linguistics & Phonetics, Saarland University","institution_ids":["https://openalex.org/I91712215"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013986373","display_name":"Kepa Joseba Rodr\u00edguez","orcid":"https://orcid.org/0000-0003-2366-6764"},"institutions":[{"id":"https://openalex.org/I4210111254","display_name":"American Society for Yad Vashem","ror":"https://ror.org/01s8e3v68","country_code":"US","type":"archive","lineage":["https://openalex.org/I4210111254"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kepa J. Rodriguez","raw_affiliation_strings":["Archives Division, Yad Vashem"],"affiliations":[{"raw_affiliation_string":"Archives Division, Yad Vashem","institution_ids":["https://openalex.org/I4210111254"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047065550","display_name":"Massimo Poesio","orcid":"https://orcid.org/0000-0001-8469-2072"},"institutions":[{"id":"https://openalex.org/I166337079","display_name":"Queen Mary University of London","ror":"https://ror.org/026zzn846","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I166337079"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Massimo Poesio","raw_affiliation_strings":["School of Electronic Engineering and Computer Science, Queen Mary University of London"],"affiliations":[{"raw_affiliation_string":"School of Electronic Engineering and Computer Science, Queen Mary University of London","institution_ids":["https://openalex.org/I166337079"]}]}],"institutions":[],"countries_distinct_count":5,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5011044971"],"corresponding_institution_ids":["https://openalex.org/I193223587"],"apc_list":null,"apc_paid":null,"fwci":4.3405,"has_fulltext":false,"cited_by_count":44,"citation_normalized_percentile":{"value":0.95454909,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"26","issue":"1","first_page":"95","last_page":"128"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8981236219406128},{"id":"https://openalex.org/keywords/coreference","display_name":"Coreference","score":0.8927440643310547},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.7036275863647461},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6771703362464905},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.6462422013282776},{"id":"https://openalex.org/keywords/anaphora","display_name":"Anaphora (linguistics)","score":0.6297036409378052},{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.6113969087600708},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6038387417793274},{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.5872257351875305},{"id":"https://openalex.org/keywords/resolution","display_name":"Resolution (logic)","score":0.4750426113605499},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.3906145393848419},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.06367582082748413}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8981236219406128},{"id":"https://openalex.org/C28076734","wikidata":"https://www.wikidata.org/wiki/Q63087","display_name":"Coreference","level":3,"score":0.8927440643310547},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.7036275863647461},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6771703362464905},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.6462422013282776},{"id":"https://openalex.org/C2781449363","wikidata":"https://www.wikidata.org/wiki/Q156751","display_name":"Anaphora (linguistics)","level":3,"score":0.6297036409378052},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.6113969087600708},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6038387417793274},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.5872257351875305},{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.4750426113605499},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3906145393848419},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.06367582082748413},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1017/s1351324919000056","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s1351324919000056","pdf_url":null,"source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},{"id":"pmh:oai:iris.unitn.it:11572/295823","is_oa":false,"landing_page_url":"http://hdl.handle.net/11572/295823","pdf_url":null,"source":{"id":"https://openalex.org/S4306401913","display_name":"Institutional Research Information System (Universit\u00e0 degli Studi di Trento)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I193223587","host_organization_name":"University of Trento","host_organization_lineage":["https://openalex.org/I193223587"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:qmro.qmul.ac.uk:123456789/58236","is_oa":false,"landing_page_url":"https://qmro.qmul.ac.uk/xmlui/handle/123456789/58236","pdf_url":null,"source":{"id":"https://openalex.org/S4306400530","display_name":"Queen Mary Research Online (Queen Mary University of London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I166337079","host_organization_name":"Queen Mary University of London","host_organization_lineage":["https://openalex.org/I166337079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6100000143051147,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":124,"referenced_works":["https://openalex.org/W87744087","https://openalex.org/W101214240","https://openalex.org/W116192430","https://openalex.org/W117665274","https://openalex.org/W176450450","https://openalex.org/W186897643","https://openalex.org/W203496455","https://openalex.org/W245306944","https://openalex.org/W261263179","https://openalex.org/W346329221","https://openalex.org/W576550507","https://openalex.org/W1207343383","https://openalex.org/W1489011351","https://openalex.org/W1489737627","https://openalex.org/W1519642432","https://openalex.org/W1528859321","https://openalex.org/W1560781570","https://openalex.org/W1577423537","https://openalex.org/W1579572287","https://openalex.org/W1593410987","https://openalex.org/W1632114991","https://openalex.org/W1755099827","https://openalex.org/W1826363161","https://openalex.org/W1865007823","https://openalex.org/W1964803238","https://openalex.org/W1967545963","https://openalex.org/W1971218560","https://openalex.org/W1972707925","https://openalex.org/W1974358919","https://openalex.org/W1980366261","https://openalex.org/W1989485152","https://openalex.org/W1996720934","https://openalex.org/W2006873020","https://openalex.org/W2007709031","https://openalex.org/W2028953697","https://openalex.org/W2033517582","https://openalex.org/W2035500771","https://openalex.org/W2044599851","https://openalex.org/W2052286186","https://openalex.org/W2053670600","https://openalex.org/W2061970800","https://openalex.org/W2066832356","https://openalex.org/W2077670769","https://openalex.org/W2082024724","https://openalex.org/W2082802837","https://openalex.org/W2083905610","https://openalex.org/W2101268022","https://openalex.org/W2105067765","https://openalex.org/W2121636384","https://openalex.org/W2122906199","https://openalex.org/W2141510042","https://openalex.org/W2141766660","https://openalex.org/W2142450061","https://openalex.org/W2147218300","https://openalex.org/W2149392590","https://openalex.org/W2153222072","https://openalex.org/W2153367954","https://openalex.org/W2153804780","https://openalex.org/W2155069789","https://openalex.org/W2157826122","https://openalex.org/W2158847908","https://openalex.org/W2161876018","https://openalex.org/W2164632894","https://openalex.org/W2165086233","https://openalex.org/W2165178592","https://openalex.org/W2170524863","https://openalex.org/W2171522936","https://openalex.org/W2171549925","https://openalex.org/W2179205908","https://openalex.org/W2180160918","https://openalex.org/W2180284103","https://openalex.org/W2182296156","https://openalex.org/W2250668331","https://openalex.org/W2250738489","https://openalex.org/W2250862915","https://openalex.org/W2250947630","https://openalex.org/W2251035762","https://openalex.org/W2251064706","https://openalex.org/W2251145093","https://openalex.org/W2251262458","https://openalex.org/W2251435592","https://openalex.org/W2251489622","https://openalex.org/W2251546258","https://openalex.org/W2251645852","https://openalex.org/W2252219904","https://openalex.org/W2252247041","https://openalex.org/W2343954916","https://openalex.org/W2407338347","https://openalex.org/W2476913205","https://openalex.org/W2485208606","https://openalex.org/W2491412609","https://openalex.org/W2506588123","https://openalex.org/W2514130906","https://openalex.org/W2561094137","https://openalex.org/W2572114200","https://openalex.org/W2575233155","https://openalex.org/W2575987980","https://openalex.org/W2576227650","https://openalex.org/W2612560781","https://openalex.org/W2627068020","https://openalex.org/W2738152205","https://openalex.org/W2756694897","https://openalex.org/W2805159201","https://openalex.org/W2805589998","https://openalex.org/W2912629390","https://openalex.org/W2962769558","https://openalex.org/W2963442673","https://openalex.org/W3126470093","https://openalex.org/W3209447568","https://openalex.org/W4205177836","https://openalex.org/W4238778312","https://openalex.org/W4244319398","https://openalex.org/W4250641076","https://openalex.org/W6604118639","https://openalex.org/W6631605494","https://openalex.org/W6633703549","https://openalex.org/W6636649193","https://openalex.org/W6675923148","https://openalex.org/W6681036856","https://openalex.org/W6681085189","https://openalex.org/W6682780409","https://openalex.org/W6683017610","https://openalex.org/W6744435112","https://openalex.org/W7051765020"],"related_works":["https://openalex.org/W3121962060","https://openalex.org/W54903681","https://openalex.org/W2891854054","https://openalex.org/W2361342447","https://openalex.org/W2114481423","https://openalex.org/W4206648670","https://openalex.org/W1578225302","https://openalex.org/W2251535201","https://openalex.org/W2805436235","https://openalex.org/W188948849"],"abstract_inverted_index":{"Abstract":[0],"This":[1],"paper":[2],"presents":[3],"the":[4,24,53,102,129,148,152,171,174],"second":[5,183],"release":[6,176],"of":[7,13,27,34,50,73,81,91,105,111,128,151,162,177],"arrau":[8,51,178],",":[9],"a":[10,89,108,160],"multigenre":[11],"corpus":[12],"anaphoric":[14,112,123],"information":[15],"created":[16],"over":[17],"10":[18],"years":[19],"to":[20,98],"provide":[21],"data":[22],"for":[23],"next":[25],"generation":[26],"coreference/anaphora":[28],"resolution":[29],"systems":[30],"combining":[31],"different":[32],"types":[33],"linguistic":[35,45],"and":[36,63,75,117,134,164,167,181],"world":[37],"knowledge":[38],"with":[39],"advanced":[40],"discourse":[41,118],"modeling":[42],"supporting":[43],"rich":[44],"annotations.":[46],"The":[47,125],"distinguishing":[48,69,149],"features":[49,150],"include":[52],"following:":[54],"treating":[55],"all":[56,147],"NPs":[57],"as":[58],"markables,":[59],"including":[60,114],"non-referring":[61],"NPs,":[62],"annotating":[64,76,88,101,107,122],"their":[65],"(non-)":[66],"referentiality":[67],"status;":[68],"between":[70,173],"several":[71],"categories":[72],"non-referentiality":[74],"non-anaphoric":[77],"mentions;":[78,106],"thorough":[79],"annotation":[80],"markable":[82],"boundaries":[83],"(minimal/maximal":[84],"spans,":[85],"discontinuous":[86],"markables);":[87],"variety":[90],"mention":[92],"attributes,":[93],"ranging":[94],"from":[95,138],"morphosyntactic":[96],"parameters":[97],"semantic":[99],"category;":[100],"genericity":[103],"status":[104],"wide":[109],"range":[110],"relations,":[113],"bridging":[115],"relations":[116],"deixis;":[119],"and,":[120],"finally,":[121],"ambiguity.":[124],"current":[126],"version":[127],"dataset":[130],"contains":[131],"350K":[132],"tokens":[133],"is":[135],"publicly":[136],"available":[137],"LDC.":[139],"In":[140],"this":[141,182],"paper,":[142],"we":[143,168],"discuss":[144,170],"in":[145,159,179],"detail":[146],"corpus,":[153],"so":[154],"far":[155],"only":[156],"partially":[157],"presented":[158],"number":[161],"conference":[163],"workshop":[165],"papers,":[166],"also":[169],"development":[172],"first":[175],"2008":[180],"one.":[184]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":13},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
