aboutsummaryrefslogtreecommitdiff
path: root/R/pkg/inst/tests/testthat/test_sparkSQL.R
diff options
context:
space:
mode:
Diffstat (limited to 'R/pkg/inst/tests/testthat/test_sparkSQL.R')
-rw-r--r-- R/pkg/inst/tests/testthat/test_sparkSQL.R 21
1 files changed, 21 insertions, 0 deletions
diff --git a/R/pkg/inst/tests/testthat/test_sparkSQL.R b/R/pkg/inst/tests/testthat/test_sparkSQL.R
index aac3f62204..a9bd325895 100644
--- a/R/pkg/inst/tests/testthat/test_sparkSQL.R
+++ b/R/pkg/inst/tests/testthat/test_sparkSQL.R
@@ -2270,6 +2270,27 @@ test_that("dapply() and dapplyCollect() on a DataFrame", {
expect_identical(expected, result)
})
+test_that("dapplyCollect() on DataFrame with a binary column", {
+ # Fixture: integer keys plus a list column of raw vectors from serialize().
+ df <- data.frame(key = 1:3)
+ df$bytes <- lapply(df$key, serialize, connection = NULL)
+ # Build the Spark-side DataFrame from the local fixture.
+ df_spark <- createDataFrame(df)
+ # collect() must hand back a data.frame identical to the fixture.
+ result1 <- collect(df_spark)
+ expect_identical(df, result1)
+ # dapplyCollect() with an identity function must do the same.
+ result2 <- dapplyCollect(df_spark, function(x) x)
+ expect_identical(df, result2)
+
+ # A data.frame with a single column of bytes
+ scb <- subset(df, select = "bytes")
+ scb_spark <- createDataFrame(scb)
+ result <- dapplyCollect(scb_spark, function(x) x)
+ expect_identical(scb, result)
+
+})
+
test_that("repartition by columns on DataFrame", {
df <- createDataFrame(
list(list(1L, 1, "1", 0.1), list(1L, 2, "2", 0.2), list(3L, 3, "3", 0.3)),