-
Notifications
You must be signed in to change notification settings - Fork 186
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Check if tests are coupled #1938
base: main
Are you sure you want to change the base?
Conversation
This comment was marked as off-topic.
This comment was marked as off-topic.
Looks like there is some order dependence between our tests. |
Could you describe how this works? I'm not reproducing. To check, I tried running our test suite with each file in an individual subprocess: tests = list.files('tests/testthat', pattern = '^test', full.names = TRUE)
for (test in tests) {
system2("Rscript", c("-e", shQuote(paste(
c(
'attach(asNamespace("lintr"), warn.conflicts=FALSE)',
"library(testthat)",
sprintf('test_file("%s")', test)
),
collapse = ";"
))))
} I see the errors in test-knitr_formats.R and test-object_name_linter.R (trivial fix incoming), but not any others. |
I guess this test also expects library(withr)
library(xml2)
library(xmlparsedata)
tests = list.files('tests/testthat', pattern = '^test', full.names = TRUE)
non_tests = setdiff(list.files('tests/testthat', full.names = TRUE), tests)
# required for assumed directory structure in tests to work in tempdir()
file.copy(non_tests, tempdir(), recursive = TRUE)
unit_xp = "expr/SYMBOL_FUNCTION_CALL[text() = 'test_that' or text() = 'with_parameters_test_that']"
lines_by_xpath <- function(xml, xpath) {
matches <- xml_find_all(xml, xpath)
line1 <- as.integer(xml_attr(matches, "line1"))
line2 <- as.integer(xml_attr(matches, "line2"))
mapply(`:`, line1, line2, SIMPLIFY = FALSE)
}
# NB: "testthat::CompactProgressReporter" is more informative
run_units_individually <- function(test_file, reporter = "testthat::FailReporter") {
message(basename(test_file))
test_xml <- read_xml(xml_parse_data(parse(test_file)))
test_lines <- readLines(test_file)
boilerplate_lines <- lines_by_xpath(test_xml, sprintf("expr[not(%s)]", unit_xp))
test_boilerplate <- test_lines[unlist(boilerplate_lines)]
test_that_units <- lines_by_xpath(test_xml, sprintf("expr[%s]", unit_xp))
for (unit in test_that_units) {
if (reporter == "testthat::FailReporter") message(".", appendLF = FALSE)
unit_name <- gsub(" ", "_", gsub('^[^"]*"|"[^"]*$', '', test_lines[unit[1L]]))
with_tempfile("tmp", pattern = paste0(basename(test_file), "_", unit_name), {
cat(test_boilerplate, file = tmp, sep = "\n")
cat(test_lines[unit], file = tmp, sep = "\n", append = TRUE)
system2(
"Rscript",
env = "TESTTHAT_EDITION=3",
c("-e", shQuote(sprintf(
'testthat::test_file("%s", package = "lintr", reporter = %s)',
tmp, reporter
)))
)
})
}
if (reporter == "testthat::FailReporter") cat("\n")
}
for (test in tests) run_units_individually(test) I see some failures, but not the same as this CI test is giving (omitting passing files):
Investigating more. |
The ones in
|
This is the exact script I am using in the GHA workflow: options(crayon.enabled = TRUE)
withr::local_envvar(TESTTHAT_PARALLEL = "FALSE")
library(cli)
library(glue)
pkgload::load_all(".")
test_script_paths <- testthat::find_test_scripts("tests/testthat")
seed <- sample.int(1e6, 1L)
cli_inform("Chosen seed for the current test run: {seed}")
set.seed(seed)
randomized_test_script_paths <- sample(test_script_paths)
any_test_failures <- FALSE
any_test_errors <- FALSE
test_path <- function(path) {
report <- as.data.frame(testthat::test_file(path, reporter = "silent"))
has_test_failures <- any(report$failed == 1L)
has_test_errors <- any(report$error == 1L)
if (has_test_failures) {
cli_alert_danger(glue("Tests in `{path}` are failing."))
any_test_failures <<- TRUE
failed_tests <- tibble::as_tibble(subset(report, failed == 1L)[, c("test", "result")])
print(glue::glue_data(failed_tests, "Test `{test}` is failing:\n{purrr::pluck(result, 1L, 1L)}"))
}
if (has_test_errors) {
cli_alert_danger(glue("There was error while running tests in `{path}`."))
any_test_errors <<- TRUE
errored_tests <- tibble::as_tibble(subset(report, error == 1L)[, c("test", "result")])
print(glue::glue_data(errored_tests, "Test `{test}` has error:\n{purrr::pluck(result, 1L, 1L)}"))
}
if (!has_test_failures && !has_test_errors) {
cli_alert_success(glue("All tests passing in `{path}`."))
}
}
cli_rule()
cli_inform("Running tests in random order:")
cli_rule()
purrr::walk(randomized_test_script_paths, test_path)
cli_rule()
if (any_test_failures) {
cli_abort("Tests in some files are failing.")
}
if (any_test_errors) {
cli_abort("There was error while running tests in some files.")
}
if (!any_test_failures && !any_test_errors) {
cli_alert_success("Tests from all files are passing!")
}
cli_rule() The approach is very simple: just randomize the order in which each test file is run. Tests within each file are always run in the same order, though. Maybe that's also something that can be included as an additional check. |
I'd suggest putting the script into |
cf. #1937