{"id":"https://openalex.org/W4379013364","doi":"https://doi.org/10.1017/s1351324923000220","title":"Polish natural language inference and factivity: An expert-based dataset and benchmarks","display_name":"Polish natural language inference and factivity: An expert-based dataset and benchmarks","publication_year":2023,"publication_date":"2023-06-01","ids":{"openalex":"https://openalex.org/W4379013364","doi":"https://doi.org/10.1017/s1351324923000220"},"language":"en","primary_location":{"id":"doi:10.1017/s1351324923000220","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1017/s1351324923000220","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/3B630FD89EA9B9F0AD6B430D8976CBA2/S1351324923000220a.pdf/div-class-title-polish-natural-language-inference-and-factivity-an-expert-based-dataset-and-benchmarks-div.pdf","source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/3B630FD89EA9B9F0AD6B430D8976CBA2/S1351324923000220a.pdf/div-class-title-polish-natural-language-inference-and-factivity-an-expert-based-dataset-and-benchmarks-div.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067792890","display_name":"Daniel Ziembicki","orcid":"https://orcid.org/0000-0003-0506-4751"},"institutions":[{"id":"https://openalex.org/I4654613","display_name":"University of Warsaw","ror":"https://ror.org/039bjqg32","country_code":"PL","type":"education","lineage":["https://openalex.org/I4654613"]}],"countries":["PL"],"is_corresponding":true,"raw_author_name":"Daniel Ziembicki","raw_affiliation_strings":["Department of Formal Linguistics, University of Warsaw, Warsaw, Poland"],"raw_orcid":"https://orcid.org/0000-0003-0506-4751","affiliations":[{"raw_affiliation_string":"Department of Formal Linguistics, University of Warsaw, Warsaw, Poland","institution_ids":["https://openalex.org/I4654613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010611519","display_name":"Karolina Seweryn","orcid":"https://orcid.org/0000-0003-0617-7301"},"institutions":[{"id":"https://openalex.org/I108403487","display_name":"Warsaw University of Technology","ror":"https://ror.org/00y0xnp53","country_code":"PL","type":"education","lineage":["https://openalex.org/I108403487"]},{"id":"https://openalex.org/I4210136276","display_name":"NASK National Research Institute","ror":"https://ror.org/03ajsaw82","country_code":"PL","type":"facility","lineage":["https://openalex.org/I4210136276"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Karolina Seweryn","raw_affiliation_strings":["Faculty of Mathematics and Information Science, Warsaw University of Technology, Warsaw, Poland","NASK - National Research Institute, Warsaw, Poland"],"raw_orcid":"https://orcid.org/0000-0003-0617-7301","affiliations":[{"raw_affiliation_string":"Faculty of Mathematics and Information Science, Warsaw University of Technology, Warsaw, Poland","institution_ids":["https://openalex.org/I108403487"]},{"raw_affiliation_string":"NASK - National Research Institute, Warsaw, Poland","institution_ids":["https://openalex.org/I4210136276"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031984813","display_name":"Anna Wr\u00f3blewska","orcid":"https://orcid.org/0000-0002-3407-7570"},"institutions":[{"id":"https://openalex.org/I108403487","display_name":"Warsaw University of Technology","ror":"https://ror.org/00y0xnp53","country_code":"PL","type":"education","lineage":["https://openalex.org/I108403487"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Anna Wr\u00f3blewska","raw_affiliation_strings":["Faculty of Mathematics and Information Science, Warsaw University of Technology, Warsaw, Poland"],"raw_orcid":"https://orcid.org/0000-0002-3407-7570","affiliations":[{"raw_affiliation_string":"Faculty of Mathematics and Information Science, Warsaw University of Technology, Warsaw, Poland","institution_ids":["https://openalex.org/I108403487"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5067792890"],"corresponding_institution_ids":["https://openalex.org/I4654613"],"apc_list":null,"apc_paid":null,"fwci":0.3313,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.63503629,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":"30","issue":"2","first_page":"385","last_page":"416"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7133697867393494},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.675664484500885},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.611798107624054},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5477790236473083},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.4564424157142639},{"id":"https://openalex.org/keywords/history","display_name":"History","score":0.09532582759857178}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7133697867393494},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.675664484500885},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.611798107624054},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5477790236473083},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.4564424157142639},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.09532582759857178},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1017/s1351324923000220","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1017/s1351324923000220","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/3B630FD89EA9B9F0AD6B430D8976CBA2/S1351324923000220a.pdf/div-class-title-polish-natural-language-inference-and-factivity-an-expert-based-dataset-and-benchmarks-div.pdf","source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1017/s1351324923000220","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1017/s1351324923000220","pdf_url":"https://www.cambridge.org/core/services/aop-cambridge-core/content/view/3B630FD89EA9B9F0AD6B430D8976CBA2/S1351324923000220a.pdf/div-class-title-polish-natural-language-inference-and-factivity-an-expert-based-dataset-and-benchmarks-div.pdf","source":{"id":"https://openalex.org/S18088403","display_name":"Natural Language Engineering","issn_l":"1351-3249","issn":["1351-3249","1469-8110"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Natural Language Engineering","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5600000023841858}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4379013364.pdf"},"referenced_works_count":67,"referenced_works":["https://openalex.org/W1882160","https://openalex.org/W1045126948","https://openalex.org/W1524295291","https://openalex.org/W1527464542","https://openalex.org/W1649228660","https://openalex.org/W1966510133","https://openalex.org/W1992365294","https://openalex.org/W2006766484","https://openalex.org/W2006941876","https://openalex.org/W2050066130","https://openalex.org/W2065280474","https://openalex.org/W2069395416","https://openalex.org/W2076518434","https://openalex.org/W2082915264","https://openalex.org/W2092358247","https://openalex.org/W2098865355","https://openalex.org/W2134273450","https://openalex.org/W2152191919","https://openalex.org/W2158880898","https://openalex.org/W2251784184","https://openalex.org/W2264742718","https://openalex.org/W2300918978","https://openalex.org/W2329766307","https://openalex.org/W2442082768","https://openalex.org/W2485094106","https://openalex.org/W2488717477","https://openalex.org/W2529466265","https://openalex.org/W2567181374","https://openalex.org/W2567922298","https://openalex.org/W2619809667","https://openalex.org/W2736741497","https://openalex.org/W2887278802","https://openalex.org/W2896457183","https://openalex.org/W2907316163","https://openalex.org/W2911964244","https://openalex.org/W2912581819","https://openalex.org/W2951286828","https://openalex.org/W2962736243","https://openalex.org/W2963154734","https://openalex.org/W2963846996","https://openalex.org/W2963918774","https://openalex.org/W2970438301","https://openalex.org/W2970789589","https://openalex.org/W2970846123","https://openalex.org/W2984256198","https://openalex.org/W2997789497","https://openalex.org/W2998230451","https://openalex.org/W3006474634","https://openalex.org/W3026404337","https://openalex.org/W3035599593","https://openalex.org/W3080275130","https://openalex.org/W3095992020","https://openalex.org/W3105639882","https://openalex.org/W3125670107","https://openalex.org/W3155292524","https://openalex.org/W3198032219","https://openalex.org/W3201344816","https://openalex.org/W4238283717","https://openalex.org/W4238722546","https://openalex.org/W4240179394","https://openalex.org/W4254506686","https://openalex.org/W6669597341","https://openalex.org/W6691910934","https://openalex.org/W6783340080","https://openalex.org/W6800803619","https://openalex.org/W6822886875","https://openalex.org/W6827521035"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W2350741829","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Abstract":[0],"Despite":[1],"recent":[2],"breakthroughs":[3],"in":[4,76,86,113,189,219],"Machine":[5],"Learning":[6],"for":[7,141,234],"Natural":[8,12],"Language":[9,13],"Processing,":[10],"the":[11,33,40,60,66,73,102,126,190,204,213,220],"Inference":[14],"(NLI)":[15],"problems":[16],"still":[17],"constitute":[18],"a":[19,26,110],"challenge.":[20],"To":[21],"this":[22,56,182],"purpose,":[23],"we":[24,58],"contribute":[25],"new":[27],"dataset":[28,80,98],"that":[29,46,146,208],"focuses":[30],"exclusively":[31],"on":[32,101,151,162,179],"factivity":[34],"phenomenon;":[35],"however,":[36],"our":[37],"task":[38],"remains":[39],"same":[41],"as":[42],"other":[43],"NLI":[44,62],"tasks,":[45],"is":[47,99,109],"prediction":[48],"of":[49,68,105,125,212,215],"entailment,":[50],"contradiction,":[51],"or":[52],"neutral":[53],"(ECN).":[54],"In":[55],"paper,":[57],"describe":[59],"LingFeatured":[61],"corpus":[63],"and":[64,88,93,108,227],"present":[65,121],"results":[67,156,168],"analyses":[69],"designed":[70],"to":[71,115],"characterize":[72],"factivity/non-factivity":[74],"opposition":[75],"natural":[77,83],"language.":[78],"The":[79,97],"contains":[81],"entirely":[82],"language":[84],"utterances":[85],"Polish":[87,106],"gathers":[89],"2432":[90],"verb-complement":[91],"pairs":[92],"309":[94],"unique":[95],"verbs.":[96],"based":[100],"National":[103],"Corpus":[104],"(NKJP)":[107],"representative":[111],"subcorpus":[112],"regard":[114],"syntactic":[116],"construction":[117],"[V][\u017ce][cc].":[118],"We":[119,136,144],"also":[120],"an":[122,231],"extended":[123],"version":[124],"set":[127],"(3035":[128],"sentences)":[129],"consisting":[130],"more":[131,185],"sentences":[132,152,206],"with":[133,224],"internal":[134],"negations.":[135],"prepared":[137,195],"deep":[138],"learning":[139],"benchmarks":[140],"both":[142],"sets.":[143],"found":[145],"transformer":[147],"BERT-based":[148,200],"models":[149,201],"working":[150],"obtained":[153],"relatively":[154],"good":[155],"(":[157,174],"$\\approx":[158,175],"89\\%$":[159],"F1":[160,177],"score":[161,178],"base":[163,180],"dataset).":[164],"Even":[165],"though":[166],"better":[167],"were":[169,194],"achieved":[170],"using":[171],"linguistic":[172],"features":[173,193],"91\\%$":[176],"dataset),":[181],"model":[183],"requires":[184],"human":[186],"labor":[187],"(humans":[188],"loop)":[191],"because":[192],"manually":[196],"by":[197],"expert":[198],"linguists.":[199],"consuming":[202],"only":[203],"input":[205],"show":[207],"they":[209],"capture":[210],"most":[211],"complexity":[214],"NLI/factivity.":[216],"Complex":[217],"cases":[218,223],"phenomenon\u2014for":[221],"example,":[222],"entitlement":[225],"(E)":[226],"non-factive":[228],"verbs\u2014still":[229],"remain":[230],"open":[232],"issue":[233],"further":[235],"research.":[236]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
