Skip to content

Commit

Permalink
group_modify
Browse files Browse the repository at this point in the history
  • Loading branch information
krlmlr committed Mar 7, 2024
1 parent e81f3ed commit eed067b
Show file tree
Hide file tree
Showing 8 changed files with 82 additions and 17 deletions.
1 change: 1 addition & 0 deletions NAMESPACE
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ S3method(group_by,duckplyr_df)
S3method(group_data,duckplyr_df)
S3method(group_keys,duckplyr_df)
S3method(group_map,duckplyr_df)
S3method(group_modify,duckplyr_df)
S3method(group_vars,duckplyr_df)
S3method(head,duckplyr_df)
S3method(inner_join,duckplyr_df)
Expand Down
37 changes: 37 additions & 0 deletions R/group_modify.R
Original file line number Diff line number Diff line change
@@ -0,0 +1,37 @@
# Generated by 02-duckplyr_df-methods.R
#' @export
group_modify.duckplyr_df <- function(.data, .f, ..., .keep = FALSE, keep = deprecated()) {
  # group_modify() method for duckplyr data frames.
  #
  # There is no relational implementation: the rel_try() call below is
  # configured with an always-TRUE fallback condition, and the work is done by
  # dplyr's data frame method.
  #
  # Arguments:
  #   .data  Input data frame.
  #   .f     Function or formula, passed through to dplyr unchanged.
  #   ...    Further arguments passed through to dplyr (and on to `.f`).
  #   .keep  Passed through to dplyr.
  #   keep   Deprecated spelling of `.keep`; forwarded only when supplied.
  #
  # Returns whatever dplyr's group_modify.data.frame() returns.

  # Our implementation
  rel_try(
    # Always fall back to dplyr
    "No relational implementation for group_modify()" = TRUE,
    {
      return(out)
    }
  )

  # dplyr forward
  group_modify <- dplyr$group_modify.data.frame

  # Forward `keep` only when the caller actually supplied it. dplyr decides
  # whether to emit its deprecation warning with `!missing(keep)`; passing
  # `keep = keep` unconditionally makes the argument look supplied on every
  # call, because this function's own `keep` has a default value.
  if (missing(keep)) {
    out <- group_modify(.data, .f, ..., .keep = .keep)
  } else {
    out <- group_modify(.data, .f, ..., .keep = .keep, keep = keep)
  }
  return(out)

  # dplyr implementation
  # (Unreachable: kept after the return() above as a reference copy of the
  # upstream method body.)
  if (!missing(keep)) {
    lifecycle::deprecate_warn("1.0.0", "group_modify(keep = )", "group_modify(.keep = )", always = TRUE)
    .keep <- keep
  }
  .f <- as_group_map_function(.f)
  .f(.data, group_keys(.data), ...)
}

duckplyr_group_modify <- function(.data, ...) {
  # Test helper: run group_modify() on the duckplyr version of `.data` and
  # hand back the result without the "duckplyr_df" class.
  #
  # If as_duckplyr_df() raises an error, the error message is turned into a
  # testthat skip instead of a failure.
  skip_with_message <- function(cnd) {
    testthat::skip(conditionMessage(cnd))
  }
  try_fetch(
    .data <- as_duckplyr_df(.data),
    error = skip_with_message
  )

  result <- group_modify(.data, ...)

  # Drop only the duckplyr marker class; every other class is kept.
  class(result) <- setdiff(class(result), "duckplyr_df")
  result
}
1 change: 1 addition & 0 deletions R/overwrite.R
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ methods_overwrite <- function() {
vctrs::s3_register("dplyr::group_data", "data.frame", group_data.duckplyr_df)
vctrs::s3_register("dplyr::group_keys", "data.frame", group_keys.duckplyr_df)
vctrs::s3_register("dplyr::group_map", "data.frame", group_map.duckplyr_df)
vctrs::s3_register("dplyr::group_modify", "data.frame", group_modify.duckplyr_df)
vctrs::s3_register("dplyr::group_vars", "data.frame", group_vars.duckplyr_df)
vctrs::s3_register("dplyr::inner_join", "data.frame", inner_join.duckplyr_df)
vctrs::s3_register("dplyr::intersect", "data.frame", intersect.duckplyr_df)
Expand Down
1 change: 1 addition & 0 deletions R/restore.R
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ methods_restore <- function() {
vctrs::s3_register("dplyr::group_data", "data.frame", dplyr$group_data.data.frame)
vctrs::s3_register("dplyr::group_keys", "data.frame", dplyr$group_keys.data.frame)
vctrs::s3_register("dplyr::group_map", "data.frame", dplyr$group_map.data.frame)
vctrs::s3_register("dplyr::group_modify", "data.frame", dplyr$group_modify.data.frame)
vctrs::s3_register("dplyr::group_vars", "data.frame", dplyr$group_vars.data.frame)
vctrs::s3_register("dplyr::inner_join", "data.frame", dplyr$inner_join.data.frame)
vctrs::s3_register("dplyr::intersect", "data.frame", dplyr$intersect.data.frame)
Expand Down
8 changes: 8 additions & 0 deletions dplyr-methods/group_modify.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
# Reference copy of dplyr's group_modify() method for plain data frames.
#
# .data  Data frame handed to `.f` as a whole.
# .f     Converted with as_group_map_function() before being called
#        (presumably accepts a function or a formula -- confirm in dplyr).
# ...    Extra arguments passed on to `.f`.
# .keep  Not read anywhere in this body other than being overwritten below.
# keep   Deprecated spelling of `.keep`.
#
# Returns the value of the single `.f` call.
group_modify.data.frame <- function(.data, .f, ..., .keep = FALSE, keep = deprecated()) {
# A supplied `keep` triggers a deprecation warning on every call
# (`always = TRUE`) and its value replaces `.keep`.
if (!missing(keep)) {
lifecycle::deprecate_warn("1.0.0", "group_modify(keep = )", "group_modify(.keep = )", always = TRUE)
.keep <- keep
}
.f <- as_group_map_function(.f)
# `.f` is called exactly once, with the full data and group_keys(.data).
.f(.data, group_keys(.data), ...)
}
16 changes: 16 additions & 0 deletions tests/testthat/test-as_duckplyr_df.R
Original file line number Diff line number Diff line change
Expand Up @@ -802,6 +802,22 @@ test_that("as_duckplyr_df() and group_map(~ .x)", {
expect_equal(pre, post)
})

test_that("as_duckplyr_df() and group_modify(~ .x)", {
  # Round-trip check: converting to a duckplyr data frame before or after
  # group_modify(~ .x) should give equal results.
  # NOTE(review): this sets DUCKPLYR_FORCE, while the neighbouring
  # group_vars() test sets DUCKPLYR_FALLBACK_FORCE -- confirm which
  # variable name is intended here.
  withr::local_envvar(DUCKPLYR_FORCE = "FALSE")

  # Currently disabled: nothing below this line runs.
  skip("Grouped")

  # Input
  input <- data.frame(a = 1:6 + 0, b = 2, g = rep(1:3, 1:3))

  # Convert first, then modify
  converted_first <- group_modify(as_duckplyr_df(input), ~ .x)
  # Modify first, then convert
  converted_last <- as_duckplyr_df(group_modify(input, ~ .x))

  # Both orders must agree
  expect_equal(converted_first, converted_last)
})

test_that("as_duckplyr_df() and group_vars()", {
withr::local_envvar(DUCKPLYR_FALLBACK_FORCE = "TRUE")

Expand Down
32 changes: 16 additions & 16 deletions tests/testthat/test-group-map.R
Original file line number Diff line number Diff line change
Expand Up @@ -30,40 +30,40 @@ test_that("duckplyr_group_map() works on ungrouped data frames (#4067)", {
)
})

test_that("group_modify() makes a grouped_df", {
test_that("duckplyr_group_modify() makes a grouped_df", {
res <- duckplyr_group_by(mtcars, cyl) %>%
group_modify(~ head(.x, 2L))
duckplyr_group_modify(~ head(.x, 2L))

expect_equal(nrow(res), 6L)
expect_equal(group_rows(res), list_of(1:2, 3:4, 5:6))

res <- iris %>%
duckplyr_group_by(Species) %>%
duckplyr_filter(Species == "setosa") %>%
group_modify(~ tally(.x))
duckplyr_group_modify(~ tally(.x))
expect_equal(nrow(res), 1L)
expect_equal(group_rows(res), list_of(1L))

res <- iris %>%
duckplyr_group_by(Species, .drop = FALSE) %>%
duckplyr_filter(Species == "setosa") %>%
group_modify(~ tally(.x))
duckplyr_group_modify(~ tally(.x))
expect_equal(nrow(res), 3L)
expect_equal(as.list(group_rows(res)), list(1L, 2L, 3L))
})

test_that("group_modify() and duckplyr_group_map() want functions with at least 2 arguments, or ... (#3996)", {
test_that("duckplyr_group_modify() and duckplyr_group_map() want functions with at least 2 arguments, or ... (#3996)", {
head1 <- function(d, ...) head(d, 1)

g <- iris %>% duckplyr_group_by(Species)
expect_equal(nrow(group_modify(g, head1)), 3L)
expect_equal(nrow(duckplyr_group_modify(g, head1)), 3L)
expect_equal(length(duckplyr_group_map(g, head1)), 3L)
})

test_that("group_modify() works on ungrouped data frames (#4067)", {
test_that("duckplyr_group_modify() works on ungrouped data frames (#4067)", {
skip("TODO duckdb")
expect_identical(
group_modify(mtcars, ~ head(.x, 2L)),
duckplyr_group_modify(mtcars, ~ head(.x, 2L)),
head(mtcars, 2L)
)
})
Expand All @@ -80,15 +80,15 @@ test_that("duckplyr_group_map() uses ptype on empty splits (#4421)", {
expect_s3_class(ptype, "data.frame")
})

test_that("group_modify() uses ptype on empty splits (#4421)", {
test_that("duckplyr_group_modify() uses ptype on empty splits (#4421)", {
res <- mtcars %>%
duckplyr_group_by(cyl) %>%
duckplyr_filter(hp > 1000) %>%
group_modify(~.x)
duckplyr_group_modify(~.x)
expect_equal(res, duckplyr_group_by(mtcars[integer(0L), names(res)], cyl))
})

test_that("group_modify() works with additional arguments (#4509)", {
test_that("duckplyr_group_modify() works with additional arguments (#4509)", {
myfun <- function(.x, .y, foo) {
.x[[foo]] <- 1
.x
Expand All @@ -103,7 +103,7 @@ test_that("group_modify() works with additional arguments (#4509)", {
targetdata$bar <- 1

expect_equal(
group_modify(.data = srcdata, .f = myfun, foo = "bar"),
duckplyr_group_modify(.data = srcdata, .f = myfun, foo = "bar"),
targetdata
)
})
Expand All @@ -119,10 +119,10 @@ test_that("duckplyr_group_map() give meaningful errors", {
head1 <- function(d) head(d, 1)

expect_snapshot({
# group_modify()
(expect_error(mtcars %>% duckplyr_group_by(cyl) %>% group_modify(~ data.frame(cyl = 19))))
(expect_error(mtcars %>% duckplyr_group_by(cyl) %>% group_modify(~ 10)))
(expect_error(iris %>% duckplyr_group_by(Species) %>% group_modify(head1)))
# duckplyr_group_modify()
(expect_error(mtcars %>% duckplyr_group_by(cyl) %>% duckplyr_group_modify(~ data.frame(cyl = 19))))
(expect_error(mtcars %>% duckplyr_group_by(cyl) %>% duckplyr_group_modify(~ 10)))
(expect_error(iris %>% duckplyr_group_by(Species) %>% duckplyr_group_modify(head1)))

# duckplyr_group_map()
(expect_error(iris %>% duckplyr_group_by(Species) %>% duckplyr_group_map(head1)))
Expand Down
3 changes: 2 additions & 1 deletion tools/00-funs.R
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,7 @@ df_methods <-
filter(!grepl("_$|^as[.]tbl$", name)) %>%
# special dplyr methods, won't implement
filter(!(name %in% c(
"group_indices", "group_modify", "group_nest", "group_size", "group_split", "group_trim", "groups", "n_groups",
"group_indices", "group_nest", "group_size", "group_split", "group_trim", "groups", "n_groups",
"same_src", # data frames can be copied into duck-frames with zero cost
NULL
))) %>%
Expand All @@ -28,6 +28,7 @@ df_methods <-
"group_data",
"group_keys",
"group_map",
"group_modify",
"rowwise",
NULL
))) %>%
Expand Down

0 comments on commit eed067b

Please sign in to comment.