From 4b4e2fe41a5b2e469d9b1ca25475a5e0e01ddec5 Mon Sep 17 00:00:00 2001 From: Daniel Date: Sun, 12 May 2024 21:33:01 +0200 Subject: [PATCH] fix --- tests/testthat/test-kruskal_wallis_test.R | 49 +++++++++++++++++++++++ tests/testthat/test-mann_whitney_test.R | 8 ++-- 2 files changed, 53 insertions(+), 4 deletions(-) create mode 100644 tests/testthat/test-kruskal_wallis_test.R diff --git a/tests/testthat/test-kruskal_wallis_test.R b/tests/testthat/test-kruskal_wallis_test.R new file mode 100644 index 00000000..9320816d --- /dev/null +++ b/tests/testthat/test-kruskal_wallis_test.R @@ -0,0 +1,49 @@ +skip_if_not_installed("survey") +skip_if_not_installed("datawizard") + +test_that("kruskal_wallis_test", { +#' data(efc) +#' # Kruskal-Wallis test for elder's age by education +#' kruskal_wallis_test(efc, "e17age", by = "c172code") +#' +#' # when data is in wide-format, specify all relevant continuous +#' # variables in `select` and omit `by` +#' set.seed(123) +#' wide_data <- data.frame( +#' scale1 = runif(20), +#' scale2 = runif(20), +#' scale3 = runif(20) +#' ) +#' kruskal_wallis_test(wide_data, select = c("scale1", "scale2", "scale3")) +#' +#' # same as if we had data in long format, with grouping variable +#' long_data <- data.frame( +#' scales = c(wide_data$scale1, wide_data$scale2, wide_data$scale3), +#' groups = rep(c("A", "B", "C"), each = 20) +#' ) +#' kruskal_wallis_test(long_data, select = "scales", by = "groups") +#' # base R equivalent +#' kruskal.test(scales ~ groups, data = long_data) + data(efc) + set.seed(123) + efc$weight <- abs(rnorm(nrow(efc), 1, 0.3)) + out1 <- mann_whitney_test(efc, "e17age", by = "e16sex") + out2 <- wilcox.test(e17age ~ e16sex, data = efc) + expect_equal(out1$w, out2$statistic, tolerance = 1e-4, ignore_attr = TRUE) + expect_equal(out1$p, out2$p.value, tolerance = 1e-4, ignore_attr = TRUE) + expect_equal(out1$estimate, -1561, tolerance = 1e-4, ignore_attr = TRUE) + expect_equal(out1$r, 0.2571254, tolerance = 1e-4, ignore_attr = TRUE) + + set.seed(123) + wide_data <- data.frame(scale1 = runif(20), scale2 = runif(20)) + out1 <- mann_whitney_test(wide_data, select = c("scale1", "scale2")) + out2 <- wilcox.test(wide_data$scale1, wide_data$scale2) + expect_equal(out1$w, out2$statistic, tolerance = 1e-4, ignore_attr = TRUE) + expect_equal(out1$p, out2$p.value, tolerance = 1e-4, ignore_attr = TRUE) + expect_equal(out1$r, 0.05132394, tolerance = 1e-4, ignore_attr = TRUE) + + out <- mann_whitney_test(efc, "e17age", by = "e16sex", weights = "weight") + expect_equal(out$p, 1.976729e-14, tolerance = 1e-4, ignore_attr = TRUE) + expect_equal(out$estimate, 0.1594972, tolerance = 1e-4, ignore_attr = TRUE) + expect_equal(out$r, 0.2599877, tolerance = 1e-4, ignore_attr = TRUE) +}) diff --git a/tests/testthat/test-mann_whitney_test.R b/tests/testthat/test-mann_whitney_test.R index e079cb93..846cae03 100644 --- a/tests/testthat/test-mann_whitney_test.R +++ b/tests/testthat/test-mann_whitney_test.R @@ -29,8 +29,8 @@ test_that("mann_whitney_test", { test_that("mann_whitney_test, sanity checks", { data(efc) - expect_errpr(mann_whitney_test(efc, "e17age", by = "c172code"), regex = "Only two groups are") - expect_errpr(mann_whitney_test(efc, c("e17age", "c172code", "e16sex")), regex = "You may only specify") - expect_errpr(mann_whitney_test(efc, c("e17age", "c172code"), by = "e17age"), regex = "If `select` specifies more") - expect_errpr(mann_whitney_test(efc, "e17age"), regex = "Only one variable provided") + expect_error(mann_whitney_test(efc, "e17age", by = "c172code"), regex = "Only two groups are") + expect_error(mann_whitney_test(efc, c("e17age", "c172code", "e16sex")), regex = "You may only specify") + expect_error(mann_whitney_test(efc, c("e17age", "c172code"), by = "e17age"), regex = "If `select` specifies more") + expect_error(mann_whitney_test(efc, "e17age"), regex = "Only one variable provided") })