{"id":"https://openalex.org/W2111216449","doi":"https://doi.org/10.3115/v1/w14-1601","title":"What's in a p-value in NLP?","display_name":"What's in a p-value in NLP?","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W2111216449","doi":"https://doi.org/10.3115/v1/w14-1601","mag":"2111216449"},"language":"en","primary_location":{"id":"doi:10.3115/v1/w14-1601","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-1601","pdf_url":"https://aclanthology.org/W14-1601.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Eighteenth Conference on Computational Natural Language Learning","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/W14-1601.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018138946","display_name":"Anders S\u00f8gaard","orcid":"https://orcid.org/0000-0001-5250-4276"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":true,"raw_author_name":"Anders S\u00f8gaard","raw_affiliation_strings":["University of Copenhagen"],"affiliations":[{"raw_affiliation_string":"University of Copenhagen","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108243977","display_name":"Anders Johannsen","orcid":null},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Anders Johannsen","raw_affiliation_strings":["University of Copenhagen, Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088832285","display_name":"Barbara Plank","orcid":"https://orcid.org/0000-0002-4394-1965"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Barbara Plank","raw_affiliation_strings":["University of Copenhagen, Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084505122","display_name":"Dirk Hovy","orcid":"https://orcid.org/0000-0002-4618-3127"},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Dirk Hovy","raw_affiliation_strings":["University of Copenhagen, Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014924576","display_name":"H\u0117ctor Mart\u00ednez Alonso","orcid":null},"institutions":[{"id":"https://openalex.org/I124055696","display_name":"University of Copenhagen","ror":"https://ror.org/035b05819","country_code":"DK","type":"education","lineage":["https://openalex.org/I124055696"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"H\u00e9ctor Mart\u00ednez Alonso","raw_affiliation_strings":["University of Copenhagen, Copenhagen, Denmark"],"affiliations":[{"raw_affiliation_string":"University of Copenhagen, Copenhagen, Denmark","institution_ids":["https://openalex.org/I124055696"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5018138946"],"corresponding_institution_ids":["https://openalex.org/I124055696"],"apc_list":null,"apc_paid":null,"fwci":4.9081,"has_fulltext":false,"cited_by_count":42,"citation_normalized_percentile":{"value":0.95356642,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6087555885314941},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5898280143737793},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.557659924030304},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.5542786717414856},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5291545391082764},{"id":"https://openalex.org/keywords/covariate","display_name":"Covariate","score":0.5025084018707275},{"id":"https://openalex.org/keywords/selection-bias","display_name":"Selection bias","score":0.4659505784511566},{"id":"https://openalex.org/keywords/sample-size-determination","display_name":"Sample size determination","score":0.4495408535003662},{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.42735472321510315},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.42141392827033997},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.3836415410041809},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.36736470460891724},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2802490293979645}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6087555885314941},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5898280143737793},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.557659924030304},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.5542786717414856},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5291545391082764},{"id":"https://openalex.org/C119043178","wikidata":"https://www.wikidata.org/wiki/Q320723","display_name":"Covariate","level":2,"score":0.5025084018707275},{"id":"https://openalex.org/C40423286","wikidata":"https://www.wikidata.org/wiki/Q284172","display_name":"Selection bias","level":2,"score":0.4659505784511566},{"id":"https://openalex.org/C129848803","wikidata":"https://www.wikidata.org/wiki/Q2564360","display_name":"Sample size determination","level":2,"score":0.4495408535003662},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.42735472321510315},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42141392827033997},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.3836415410041809},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36736470460891724},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2802490293979645},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3115/v1/w14-1601","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-1601","pdf_url":"https://aclanthology.org/W14-1601.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Eighteenth Conference on Computational Natural Language Learning","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.3115/v1/w14-1601","is_oa":true,"landing_page_url":"https://doi.org/10.3115/v1/w14-1601","pdf_url":"https://aclanthology.org/W14-1601.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Eighteenth Conference on Computational Natural Language Learning","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.6600000262260437,"display_name":"No poverty","id":"https://metadata.un.org/sdg/1"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2111216449.pdf","grobid_xml":"https://content.openalex.org/works/W2111216449.grobid-xml"},"referenced_works_count":39,"referenced_works":["https://openalex.org/W1716356","https://openalex.org/W759515131","https://openalex.org/W1515847863","https://openalex.org/W1565746575","https://openalex.org/W1568793342","https://openalex.org/W1594768313","https://openalex.org/W1850558006","https://openalex.org/W1966786910","https://openalex.org/W1995945562","https://openalex.org/W1996430422","https://openalex.org/W2016522586","https://openalex.org/W2027979924","https://openalex.org/W2056451646","https://openalex.org/W2057399676","https://openalex.org/W2075635421","https://openalex.org/W2099032682","https://openalex.org/W2101105183","https://openalex.org/W2101461018","https://openalex.org/W2103374253","https://openalex.org/W2105824687","https://openalex.org/W2111362445","https://openalex.org/W2120354757","https://openalex.org/W2123301721","https://openalex.org/W2133280805","https://openalex.org/W2134899753","https://openalex.org/W2136082655","https://openalex.org/W2142746600","https://openalex.org/W2144578941","https://openalex.org/W2144600658","https://openalex.org/W2148497595","https://openalex.org/W2154652894","https://openalex.org/W2158108973","https://openalex.org/W2161498332","https://openalex.org/W2169438272","https://openalex.org/W2171421863","https://openalex.org/W2252040980","https://openalex.org/W2331384579","https://openalex.org/W2569308312","https://openalex.org/W2600110521"],"related_works":["https://openalex.org/W2985746494","https://openalex.org/W4206042385","https://openalex.org/W2511384863","https://openalex.org/W2080773131","https://openalex.org/W2096089271","https://openalex.org/W2923628599","https://openalex.org/W3023061746","https://openalex.org/W2168206775","https://openalex.org/W2901259384","https://openalex.org/W2112420322"],"abstract_inverted_index":{"In":[0],"NLP,":[1],"we":[2,76,96],"need":[3,77],"to":[4,15,47,58,83,91],"document":[5],"that":[6,33,66],"our":[7],"proposed":[8],"methods":[9],"perform":[10],"significantly":[11],"better":[12],"with":[13],"respect":[14],"standard":[16],"metrics":[17,72],"than":[18],"previous":[19],"approaches,":[20],"typically":[21],"by":[22,26],"reporting":[23],"p-values":[24],"obtained":[25],"rank-":[27],"or":[28],"randomization-based":[29],"tests.":[30],"We":[31,64],"show":[32],"significance":[34,79],"results":[35,90],"following":[36],"current":[37],"research":[38],"standards":[39],"are":[40],"unreliable":[41],"and,":[42],"in":[43,94],"addition,":[44],"very":[45],"sensitive":[46],"sample":[48],"size,":[49],"covariates":[50],"such":[51],"as":[52,55,57],"sentence":[53],"length,":[54],"well":[56],"the":[59,68,85],"existence":[60],"of":[61,70,87],"multiple":[62],"metrics.":[63],"estimate":[65],"under":[67],"assumption":[69],"perfect":[71],"and":[73,102],"unbiased":[74],"data,":[75],"a":[78],"cut-off":[80],"at":[81],"\u21e00.0025":[82],"reduce":[84],"risk":[86],"false":[88],"positive":[89],"<5%.":[92],"Since":[93],"practice":[95],"often":[97],"have":[98],"considerable":[99],"selection":[100],"bias":[101],"poor":[103],"metrics,":[104],"this,":[105],"however,":[106],"will":[107],"not":[108],"do":[109],"alone.":[110]},"counts_by_year":[{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":11},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":8},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":5},{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
