r/tests/testthat/test-Array.R - arrow - Git at Google

 # Licensed to the Apache Software Foundation (ASF) under one
 # or more contributor license agreements.  See the NOTICE file
 # distributed with this work for additional information
 # regarding copyright ownership.  The ASF licenses this file
 # to you under the Apache License, Version 2.0 (the
 # "License"); you may not use this file except in compliance
 # with the License.  You may obtain a copy of the License at
 #
 #   http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing,
 # software distributed under the License is distributed on an
 # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 # KIND, either express or implied.  See the License for the
 # specific language governing permissions and limitations
 # under the License.

 context("Array")

 test_that("Integer Array", {
   ints <- c(1:10, 1:10, 1:5)
   x <- expect_array_roundtrip(ints, int32())
 })

 test_that("binary Array", {
   # if the type is given, we just need a list of raw vectors
   bin <- list(as.raw(1:10), as.raw(1:10))
   expect_array_roundtrip(bin, binary(), as = binary())
   expect_array_roundtrip(bin, large_binary(), as = large_binary())
   expect_array_roundtrip(bin, fixed_size_binary(10), as = fixed_size_binary(10))

   bin[[1L]] <- as.raw(1:20)
   expect_error(Array$create(bin, fixed_size_binary(10)))

   # otherwise the arrow type is deduced from the R classes
   bin <- vctrs::new_vctr(
     list(as.raw(1:10), as.raw(11:20)),
     class = "arrow_binary"
   )
   expect_array_roundtrip(bin, binary())

   bin <- vctrs::new_vctr(
     list(as.raw(1:10), as.raw(11:20)),
     class = "arrow_large_binary"
   )
   expect_array_roundtrip(bin, large_binary())

   bin <- vctrs::new_vctr(
     list(as.raw(1:10), as.raw(11:20)),
     class = "arrow_fixed_size_binary",
     byte_width = 10L
   )
   expect_array_roundtrip(bin, fixed_size_binary(byte_width = 10))

   # degenerate cases
   bin <- vctrs::new_vctr(
     list(1:10),
     class = "arrow_binary"
   )
   expect_error(Array$create(bin))

   bin <- vctrs::new_vctr(
     list(1:10),
     ptype = raw(),
     class = "arrow_large_binary"
   )
   expect_error(Array$create(bin))

   bin <- vctrs::new_vctr(
     list(1:10),
     class = "arrow_fixed_size_binary",
     byte_width = 10
   )
   expect_error(Array$create(bin))

   bin <- vctrs::new_vctr(
     list(as.raw(1:5)),
     class = "arrow_fixed_size_binary",
     byte_width = 10
   )
   expect_error(Array$create(bin))

   bin <- vctrs::new_vctr(
     list(as.raw(1:5)),
     class = "arrow_fixed_size_binary"
   )
   expect_error(Array$create(bin))
 })

 test_that("Slice() and RangeEquals()", {
   ints <- c(1:10, 101:110, 201:205)
   x <- Array$create(ints)

   y <- x$Slice(10)
   expect_equal(y$type, int32())
   expect_equal(length(y), 15L)
   expect_vector(y, c(101:110, 201:205))
   expect_true(x$RangeEquals(y, 10, 24))
   expect_false(x$RangeEquals(y, 9, 23))
   expect_false(x$RangeEquals(y, 11, 24))

   z <- x$Slice(10, 5)
   expect_vector(z, c(101:105))
   expect_true(x$RangeEquals(z, 10, 15, 0))

   # Input validation
   expect_error(x$Slice("ten"))
   expect_error(x$Slice(NA_integer_), "Slice 'offset' cannot be NA")
   expect_error(x$Slice(NA), "Slice 'offset' cannot be NA")
   expect_error(x$Slice(10, "ten"))
   expect_error(x$Slice(10, NA_integer_), "Slice 'length' cannot be NA")
   expect_error(x$Slice(NA_integer_, NA_integer_), "Slice 'offset' cannot be NA")
   expect_error(x$Slice(c(10, 10)))
   expect_error(x$Slice(10, c(10, 10)))
   expect_error(x$Slice(1000), "Slice 'offset' greater than array length")
   expect_error(x$Slice(-1), "Slice 'offset' cannot be negative")
   expect_error(z$Slice(10, 10), "Slice 'offset' greater than array length")
   expect_error(x$Slice(10, -1), "Slice 'length' cannot be negative")
   expect_error(x$Slice(-1, 10), "Slice 'offset' cannot be negative")

   expect_warning(x$Slice(10, 15), NA)
   expect_warning(
     overslice <- x$Slice(10, 16),
     "Slice 'length' greater than available length"
   )
   expect_equal(length(overslice), 15)
   expect_warning(z$Slice(2, 10), "Slice 'length' greater than available length")

   expect_error(x$RangeEquals(10, 24, 0), 'other must be a "Array"')
   expect_error(x$RangeEquals(y, NA, 24), "'start_idx' cannot be NA")
   expect_error(x$RangeEquals(y, 10, NA), "'end_idx' cannot be NA")
   expect_error(x$RangeEquals(y, 10, 24, NA), "'other_start_idx' cannot be NA")
   expect_error(x$RangeEquals(y, "ten", 24))
   # TODO (if anyone uses RangeEquals)
   # expect_error(x$RangeEquals(y, 10, 2400, 0)) # does not error
   # expect_error(x$RangeEquals(y, 1000, 24, 0)) # does not error
   # expect_error(x$RangeEquals(y, 10, 24, 1000)) # does not error
 })

 test_that("Double Array", {
   dbls <- c(1, 2, 3, 4, 5, 6)
   x_dbl <- expect_array_roundtrip(dbls, float64())
 })

 test_that("Array print method includes type", {
   x <- Array$create(c(1:10, 1:10, 1:5))
   expect_output(print(x), "Array\n<int32>\n[\n", fixed = TRUE)
 })

 test_that("Array supports NA", {
   x_int <- Array$create(as.integer(c(1:10, NA)))
   x_dbl <- Array$create(as.numeric(c(1:10, NA)))
   expect_true(x_int$IsValid(0))
   expect_true(x_dbl$IsValid(0L))
   expect_true(x_int$IsNull(10L))
   expect_true(x_dbl$IsNull(10))

   expect_equal(as.vector(is.na(x_int)), c(rep(FALSE, 10), TRUE))
   expect_equal(as.vector(is.na(x_dbl)), c(rep(FALSE, 10), TRUE))

   # Input validation
   expect_error(x_int$IsValid("ten"))
   expect_error(x_int$IsNull("ten"))
   expect_error(x_int$IsValid(c(10, 10)))
   expect_error(x_int$IsNull(c(10, 10)))
   expect_error(x_int$IsValid(NA), "'i' cannot be NA")
   expect_error(x_int$IsNull(NA), "'i' cannot be NA")
   expect_error(x_int$IsValid(1000), "subscript out of bounds")
   expect_error(x_int$IsValid(-1), "subscript out of bounds")
   expect_error(x_int$IsNull(1000), "subscript out of bounds")
   expect_error(x_int$IsNull(-1), "subscript out of bounds")
 })

 test_that("Array support null type (ARROW-7064)", {
   expect_array_roundtrip(vctrs::unspecified(10), null())
 })

 test_that("Array supports logical vectors (ARROW-3341)", {
   # with NA
   x <- sample(c(TRUE, FALSE, NA), 1000, replace = TRUE)
   expect_array_roundtrip(x, bool())

   # without NA
   x <- sample(c(TRUE, FALSE), 1000, replace = TRUE)
   expect_array_roundtrip(x, bool())
 })

 test_that("Array supports character vectors (ARROW-3339)", {
   # without NA
   expect_array_roundtrip(c("itsy", "bitsy", "spider"), utf8())
   expect_array_roundtrip(c("itsy", "bitsy", "spider"), large_utf8(), as = large_utf8())

   # with NA
   expect_array_roundtrip(c("itsy", NA, "spider"), utf8())
   expect_array_roundtrip(c("itsy", NA, "spider"), large_utf8(), as = large_utf8())
 })

 test_that("Character vectors > 2GB become large_utf8", {
   skip_on_cran()
   skip_if_not_running_large_memory_tests()
   big <- make_big_string()
   expect_array_roundtrip(big, large_utf8())
 })

 test_that("empty arrays are supported", {
   expect_array_roundtrip(character(), utf8())
   expect_array_roundtrip(character(), large_utf8(), as = large_utf8())
   expect_array_roundtrip(integer(), int32())
   expect_array_roundtrip(numeric(), float64())
   expect_array_roundtrip(factor(character()), dictionary(int8(), utf8()))
   expect_array_roundtrip(logical(), bool())
 })

 test_that("array with all nulls are supported", {
   nas <- c(NA, NA)
   expect_array_roundtrip(as.character(nas), utf8())
   expect_array_roundtrip(as.integer(nas), int32())
   expect_array_roundtrip(as.numeric(nas), float64())
   expect_array_roundtrip(as.factor(nas), dictionary(int8(), utf8()))
   expect_array_roundtrip(as.logical(nas), bool())
 })

 test_that("Array supports unordered factors (ARROW-3355)", {
   # without NA
   f <- factor(c("itsy", "bitsy", "spider", "spider"))
   expect_array_roundtrip(f, dictionary(int8(), utf8()))

   # with NA
   f <- factor(c("itsy", "bitsy", NA, "spider", "spider"))
   expect_array_roundtrip(f, dictionary(int8(), utf8()))
 })

 test_that("Array supports ordered factors (ARROW-3355)", {
   # without NA
   f <- ordered(c("itsy", "bitsy", "spider", "spider"))
   arr_fac <- expect_array_roundtrip(f, dictionary(int8(), utf8(), ordered = TRUE))
   expect_true(arr_fac$ordered)

   # with NA
   f <- ordered(c("itsy", "bitsy", NA, "spider", "spider"))
   expect_array_roundtrip(f, dictionary(int8(), utf8(), ordered = TRUE))
 })

 test_that("array supports Date (ARROW-3340)", {
   d <- Sys.Date() + 1:10
   expect_array_roundtrip(d, date32())

   d[5] <- NA
   expect_array_roundtrip(d, date32())
 })

 test_that("array supports POSIXct (ARROW-3340)", {
   times <- lubridate::ymd_hms("2018-10-07 19:04:05") + 1:10
   expect_array_roundtrip(times, timestamp("us", "UTC"))

   times[5] <- NA
   expect_array_roundtrip(times, timestamp("us", "UTC"))

   times2 <- lubridate::ymd_hms("2018-10-07 19:04:05", tz = "US/Eastern") + 1:10
   expect_array_roundtrip(times2, timestamp("us", "US/Eastern"))
 })

 test_that("array supports POSIXct without timezone", {
   # Make sure timezone is not set
   withr::with_envvar(c(TZ = ""), {
     times <- strptime("2019-02-03 12:34:56", format="%Y-%m-%d %H:%M:%S") + 1:10
     expect_array_roundtrip(times, timestamp("us", ""))

     # Also test the INTSXP code path
     skip("Ingest_POSIXct only implemented for REALSXP")
     times_int <- as.integer(times)
     attributes(times_int) <- attributes(times)
     expect_array_roundtrip(times_int, timestamp("us", ""))
   })
 })

 test_that("Timezone handling in Arrow roundtrip (ARROW-3543)", {
   # Write a feather file as that's what the initial bug report used
   df <- tibble::tibble(
     no_tz = lubridate::ymd_hms("2018-10-07 19:04:05") + 1:10,
     yes_tz = lubridate::ymd_hms("2018-10-07 19:04:05", tz = "Asia/Pyongyang") + 1:10
   )
   if (!identical(Sys.timezone(), "Asia/Pyongyang")) {
     # Confirming that the columns are in fact different
     expect_false(any(df$no_tz == df$yes_tz))
   }
   feather_file <- tempfile()
   on.exit(unlink(feather_file))
   write_feather(df, feather_file)
   expect_identical(read_feather(feather_file), df)
 })

 test_that("array supports integer64", {
   x <- bit64::as.integer64(1:10) + MAX_INT
   expect_array_roundtrip(x, int64())

   x[4] <- NA
   expect_array_roundtrip(x, int64())

   # all NA int64 (ARROW-3795)
   all_na <- Array$create(bit64::as.integer64(NA))
   expect_type_equal(all_na, int64())
   expect_true(as.vector(is.na(all_na)))
 })

 test_that("array supports difftime", {
   time <- hms::hms(56, 34, 12)
   expect_array_roundtrip(c(time, time), time32("s"))
   expect_array_roundtrip(vctrs::vec_c(NA, time), time32("s"))
 })

 test_that("support for NaN (ARROW-3615)", {
   x <- c(1, NA, NaN, -1)
   y <- Array$create(x)
   expect_true(y$IsValid(2))
   expect_equal(y$null_count, 1L)
 })

 test_that("integer types casts (ARROW-3741)", {
   # Defining some type groups for use here and in the following tests
   int_types <- c(int8(), int16(), int32(), int64())
   uint_types <- c(uint8(), uint16(), uint32(), uint64())
   float_types <- c(float32(), float64()) # float16() not really supported in C++ yet

   a <- Array$create(c(1:10, NA))
   for (type in c(int_types, uint_types)) {
     casted <- a$cast(type)
     expect_equal(casted$type, type)
     expect_identical(as.vector(is.na(casted)), c(rep(FALSE, 10), TRUE))
   }
 })

 test_that("integer types cast safety (ARROW-3741, ARROW-5541)", {
   a <- Array$create(-(1:10))
   for (type in uint_types) {
     expect_error(a$cast(type), regexp = "Integer value -1 not in range")
     expect_error(a$cast(type, safe = FALSE), NA)
   }
 })

 test_that("float types casts (ARROW-3741)", {
   x <- c(1, 2, 3, NA)
   a <- Array$create(x)
   for (type in float_types) {
     casted <- a$cast(type)
     expect_equal(casted$type, type)
     expect_identical(as.vector(is.na(casted)), c(rep(FALSE, 3), TRUE))
     expect_identical(as.vector(casted), x)
   }
 })

 test_that("cast to half float works", {
   skip("Need halffloat support: https://issues.apache.org/jira/browse/ARROW-3802")
   a <- Array$create(1:4)
   a_f16 <- a$cast(float16())
   expect_type_equal(a_16$type, float16())
 })

 test_that("cast input validation", {
   a <- Array$create(1:4)
   expect_error(a$cast("not a type"), "type must be a DataType, not character")
 })

 test_that("Array$create() supports the type= argument. conversion from INTSXP and int64 to all int types", {
   num_int32 <- 12L
   num_int64 <- bit64::as.integer64(10)

   types <- c(
     int_types,
     uint_types,
     float_types,
     double() # not actually a type, a base R function but should be alias for float64
   )
   for (type in types) {
     expect_type_equal(Array$create(num_int32, type = type)$type, as_type(type))
     expect_type_equal(Array$create(num_int64, type = type)$type, as_type(type))
   }

   # Input validation
   expect_error(
     Array$create(5, type = "not a type"),
     "type must be a DataType, not character"
   )
 })

 test_that("Array$create() aborts on overflow", {
   expect_error(Array$create(128L, type = int8()))
   expect_error(Array$create(-129L, type = int8()))

   expect_error(Array$create(256L, type = uint8()))
   expect_error(Array$create(-1L, type = uint8()))

   expect_error(Array$create(32768L, type = int16()))
   expect_error(Array$create(-32769L, type = int16()))

   expect_error(Array$create(65536L, type = uint16()))
   expect_error(Array$create(-1L, type = uint16()))

   expect_error(Array$create(65536L, type = uint16()))
   expect_error(Array$create(-1L, type = uint16()))

   expect_error(Array$create(bit64::as.integer64(2^31), type = int32()))
   expect_error(Array$create(bit64::as.integer64(2^32), type = uint32()))
 })

 test_that("Array$create() does not convert doubles to integer", {
   for (type in c(int_types, uint_types)) {
     a <- Array$create(10, type = type)
     expect_type_equal(a$type, type)
     expect_true(as.vector(a) == 10L)
   }
 })

 test_that("Array$create() converts raw vectors to uint8 arrays (ARROW-3794)", {
   expect_type_equal(Array$create(as.raw(1:10))$type, uint8())
 })

 test_that("Array<int8>$as_vector() converts to integer (ARROW-3794)", {
   i8 <- (-128):127
   a <- Array$create(i8)$cast(int8())
   expect_type_equal(a, int8())
   expect_equal(as.vector(a), i8)

   u8 <- 0:255
   a <- Array$create(u8)$cast(uint8())
   expect_type_equal(a, uint8())
   expect_equal(as.vector(a), u8)
 })

 test_that("Arrays of {,u}int{32,64} convert to integer if they can fit", {
   u32 <- Array$create(1L)$cast(uint32())
   expect_identical(as.vector(u32), 1L)

   u64 <- Array$create(1L)$cast(uint64())
   expect_identical(as.vector(u64), 1L)

   i64 <- Array$create(bit64::as.integer64(1:10))
   expect_identical(as.vector(i64), 1:10)
 })

 test_that("Arrays of uint{32,64} convert to numeric if they can't fit integer", {
   u32 <- Array$create(bit64::as.integer64(1) + MAX_INT)$cast(uint32())
   expect_identical(as.vector(u32), 1 + MAX_INT)

   u64 <- Array$create(bit64::as.integer64(1) + MAX_INT)$cast(uint64())
   expect_identical(as.vector(u64), 1 + MAX_INT)
 })

 test_that("Array$create() recognise arrow::Array (ARROW-3815)", {
   a <- Array$create(1:10)
   expect_equal(a, Array$create(a))
 })

 test_that("Array$create() handles data frame -> struct arrays (ARROW-3811)", {
   df <- tibble::tibble(x = 1:10, y = x / 2, z = letters[1:10])
   a <- Array$create(df)
   expect_type_equal(a$type, struct(x = int32(), y = float64(), z = utf8()))
   expect_equivalent(as.vector(a), df)

   df <- structure(list(col = structure(list(structure(list(list(structure(1))), class = "inner")), class = "outer")), class = "data.frame", row.names = c(NA, -1L))
   a <- Array$create(df)
   expect_type_equal(a$type, struct(col = list_of(list_of(list_of(float64())))))
   expect_equivalent(as.vector(a), df)
 })

 test_that("StructArray methods", {
   df <- tibble::tibble(x = 1:10, y = x / 2, z = letters[1:10])
   a <- Array$create(df)
   expect_equal(a$x, Array$create(df$x))
   expect_equal(a[["x"]], Array$create(df$x))
   expect_equal(a[[1]], Array$create(df$x))
   expect_identical(names(a), c("x", "y", "z"))
   expect_identical(dim(a), c(10L, 3L))
 })

 test_that("Array$create() can handle data frame with custom struct type (not inferred)", {
   df <- tibble::tibble(x = 1:10, y = 1:10)
   type <- struct(x = float64(), y = int16())
   a <- Array$create(df, type = type)
   expect_type_equal(a$type, type)

   type <- struct(x = float64(), y = int16(), z = int32())
   expect_error(Array$create(df, type = type), regexp = "Number of fields in struct.* incompatible with number of columns in the data frame")

   type <- struct(y = int16(), x = float64())
   expect_error(Array$create(df, type = type), regexp = "Field name in position.*does not match the name of the column of the data frame")

   type <- struct(x = float64(), y = utf8())
   expect_error(Array$create(df, type = type), regexp = "Invalid")
 })

 test_that("Array$create() supports tibble with no columns (ARROW-8354)", {
   df <- tibble::tibble()
   expect_equal(Array$create(df)$as_vector(), df)
 })

 test_that("Array$create() handles vector -> list arrays (ARROW-7662)", {
   # Should be able to create an empty list with a type hint.
   expect_r6_class(Array$create(list(), list_of(bool())), "ListArray")

   # logical
   expect_array_roundtrip(list(NA), list_of(bool()))
   expect_array_roundtrip(list(logical(0)), list_of(bool()))
   expect_array_roundtrip(list(c(TRUE), c(FALSE), c(FALSE, TRUE)), list_of(bool()))
   expect_array_roundtrip(list(c(TRUE), c(FALSE), NA, logical(0), c(FALSE, NA, TRUE)), list_of(bool()))

   # integer
   expect_array_roundtrip(list(NA_integer_), list_of(int32()))
   expect_array_roundtrip(list(integer(0)), list_of(int32()))
   expect_array_roundtrip(list(1:2, 3:4, 12:18), list_of(int32()))
   expect_array_roundtrip(list(c(1:2), NA_integer_, integer(0), c(12:18, NA_integer_)), list_of(int32()))

   # numeric
   expect_array_roundtrip(list(NA_real_), list_of(float64()))
   expect_array_roundtrip(list(numeric(0)), list_of(float64()))
   expect_array_roundtrip(list(1, c(2, 3), 4), list_of(float64()))
   expect_array_roundtrip(list(1, numeric(0), c(2, 3, NA_real_), 4), list_of(float64()))

   # character
   expect_array_roundtrip(list(NA_character_), list_of(utf8()))
   expect_array_roundtrip(list(character(0)), list_of(utf8()))
   expect_array_roundtrip(list("itsy", c("bitsy", "spider"), c("is")), list_of(utf8()))
   expect_array_roundtrip(list("itsy", character(0), c("bitsy", "spider", NA_character_), c("is")), list_of(utf8()))

   # factor
   expect_array_roundtrip(list(factor(c("b", "a"), levels = c("a", "b"))), list_of(dictionary(int8(), utf8())))
   expect_array_roundtrip(list(factor(NA, levels = c("a", "b"))), list_of(dictionary(int8(), utf8())))

   # struct
   expect_array_roundtrip(
     list(tibble::tibble(a = integer(0), b = integer(0), c = character(0), d = logical(0))),
     list_of(struct(a = int32(), b = int32(), c = utf8(), d = bool()))
   )
   expect_array_roundtrip(
     list(tibble::tibble(a = list(integer()))),
     list_of(struct(a = list_of(int32())))
   )
   # degenerated data frame
   df <- structure(list(x = 1:2, y = 1), class = "data.frame", row.names = 1:2)
   expect_error(Array$create(list(df)))
 })

 test_that("Array$create() handles vector -> large list arrays", {
   # Should be able to create an empty list with a type hint.
   expect_r6_class(Array$create(list(), type = large_list_of(bool())), "LargeListArray")

   # logical
   expect_array_roundtrip(list(NA), large_list_of(bool()), as = large_list_of(bool()))
   expect_array_roundtrip(list(logical(0)), large_list_of(bool()), as = large_list_of(bool()))
   expect_array_roundtrip(list(c(TRUE), c(FALSE), c(FALSE, TRUE)), large_list_of(bool()), as = large_list_of(bool()))
   expect_array_roundtrip(list(c(TRUE), c(FALSE), NA, logical(0), c(FALSE, NA, TRUE)), large_list_of(bool()), as = large_list_of(bool()))

   # integer
   expect_array_roundtrip(list(NA_integer_), large_list_of(int32()), as = large_list_of(int32()))
   expect_array_roundtrip(list(integer(0)), large_list_of(int32()), as = large_list_of(int32()))
   expect_array_roundtrip(list(1:2, 3:4, 12:18), large_list_of(int32()), as = large_list_of(int32()))
   expect_array_roundtrip(list(c(1:2), NA_integer_, integer(0), c(12:18, NA_integer_)), large_list_of(int32()), as = large_list_of(int32()))

   # numeric
   expect_array_roundtrip(list(NA_real_), large_list_of(float64()), as = large_list_of(float64()))
   expect_array_roundtrip(list(numeric(0)), large_list_of(float64()), as = large_list_of(float64()))
   expect_array_roundtrip(list(1, c(2, 3), 4), large_list_of(float64()), as = large_list_of(float64()))
   expect_array_roundtrip(list(1, numeric(0), c(2, 3, NA_real_), 4), large_list_of(float64()), as = large_list_of(float64()))

   # character
   expect_array_roundtrip(list(NA_character_), large_list_of(utf8()), as = large_list_of(utf8()))
   expect_array_roundtrip(list(character(0)), large_list_of(utf8()), as = large_list_of(utf8()))
   expect_array_roundtrip(list("itsy", c("bitsy", "spider"), c("is")), large_list_of(utf8()), as = large_list_of(utf8()))
   expect_array_roundtrip(list("itsy", character(0), c("bitsy", "spider", NA_character_), c("is")), large_list_of(utf8()), as = large_list_of(utf8()))

   # factor
   expect_array_roundtrip(list(factor(c("b", "a"), levels = c("a", "b"))), large_list_of(dictionary(int8(), utf8())), as = large_list_of(dictionary(int8(), utf8())))
   expect_array_roundtrip(list(factor(NA, levels = c("a", "b"))), large_list_of(dictionary(int8(), utf8())), as = large_list_of(dictionary(int8(), utf8())))

   # struct
   expect_array_roundtrip(
     list(tibble::tibble(a = integer(0), b = integer(0), c = character(0), d = logical(0))),
     large_list_of(struct(a = int32(), b = int32(), c = utf8(), d = bool())),
     as = large_list_of(struct(a = int32(), b = int32(), c = utf8(), d = bool()))
   )
   expect_array_roundtrip(
     list(tibble::tibble(a = list(integer()))),
     large_list_of(struct(a = list_of(int32()))),
     as = large_list_of(struct(a = list_of(int32())))
   )
 })

 test_that("Array$create() handles vector -> fixed size list arrays", {
   # Should be able to create an empty list with a type hint.
   expect_r6_class(Array$create(list(), type = fixed_size_list_of(bool(), 20)), "FixedSizeListArray")

   # logical
   expect_array_roundtrip(list(NA), fixed_size_list_of(bool(), 1L), as = fixed_size_list_of(bool(), 1L))
   expect_array_roundtrip(list(c(TRUE, FALSE), c(FALSE, TRUE)), fixed_size_list_of(bool(), 2L), as = fixed_size_list_of(bool(), 2L))
   expect_array_roundtrip(list(c(TRUE), c(FALSE), NA), fixed_size_list_of(bool(), 1L), as = fixed_size_list_of(bool(), 1L))

   # integer
   expect_array_roundtrip(list(NA_integer_), fixed_size_list_of(int32(), 1L), as = fixed_size_list_of(int32(), 1L))
   expect_array_roundtrip(list(1:2, 3:4, 11:12), fixed_size_list_of(int32(), 2L), as = fixed_size_list_of(int32(), 2L))
   expect_array_roundtrip(list(c(1:2), c(NA_integer_, 3L)), fixed_size_list_of(int32(), 2L), as = fixed_size_list_of(int32(), 2L))

   # numeric
   expect_array_roundtrip(list(NA_real_), fixed_size_list_of(float64(), 1L), as = fixed_size_list_of(float64(), 1L))
   expect_array_roundtrip(list(c(1,2), c(2, 3)), fixed_size_list_of(float64(), 2L), as = fixed_size_list_of(float64(), 2L))
   expect_array_roundtrip(list(c(1,2), c(NA_real_, 4)), fixed_size_list_of(float64(), 2L), as = fixed_size_list_of(float64(), 2L))

   # character
   expect_array_roundtrip(list(NA_character_), fixed_size_list_of(utf8(), 1L), as = fixed_size_list_of(utf8(), 1L))
   expect_array_roundtrip(list(c("itsy", "bitsy"), c("spider", "is"), c(NA_character_, NA_character_), c("", "")), fixed_size_list_of(utf8(), 2L), as = fixed_size_list_of(utf8(), 2L))

   # factor
   expect_array_roundtrip(list(factor(c("b", "a"), levels = c("a", "b"))), fixed_size_list_of(dictionary(int8(), utf8()), 2L), as = fixed_size_list_of(dictionary(int8(), utf8()), 2L))

   # struct
   expect_array_roundtrip(
     list(tibble::tibble(a = 1L, b = 1L, c = "", d = TRUE)),
     fixed_size_list_of(struct(a = int32(), b = int32(), c = utf8(), d = bool()), 1L),
     as = fixed_size_list_of(struct(a = int32(), b = int32(), c = utf8(), d = bool()), 1L)
   )
   expect_array_roundtrip(
     list(tibble::tibble(a = list(1L))),
     fixed_size_list_of(struct(a = list_of(int32())), 1L),
     as = fixed_size_list_of(struct(a = list_of(int32())), 1L)
   )
   expect_array_roundtrip(
     list(tibble::tibble(a = list(1L))),
     list_of(struct(a = fixed_size_list_of(int32(), 1L))),
     as = list_of(struct(a = fixed_size_list_of(int32(), 1L)))
   )
 })

 test_that("Handling string data with embedded nuls", {
   raws <- structure(list(
     as.raw(c(0x70, 0x65, 0x72, 0x73, 0x6f, 0x6e)),
     as.raw(c(0x77, 0x6f, 0x6d, 0x61, 0x6e)),
     as.raw(c(0x6d, 0x61, 0x00, 0x6e)), # <-- there's your nul, 0x00
     as.raw(c(0x66, 0x00, 0x00, 0x61, 0x00, 0x6e)), # multiple nuls
     as.raw(c(0x63, 0x61, 0x6d, 0x65, 0x72, 0x61)),
     as.raw(c(0x74, 0x76))),
     class = c("arrow_binary", "vctrs_vctr", "list"))
   expect_error(
     rawToChar(raws[[3]]),
     "embedded nul in string: 'ma\\0n'", # See?
     fixed = TRUE
   )
   array_with_nul <- Array$create(raws)$cast(utf8())
   expect_error(
     as.vector(array_with_nul),
     "embedded nul in string: 'ma\\0n'; to strip nuls when converting from Arrow to R, set options(arrow.skip_nul = TRUE)",
     fixed = TRUE
   )

   withr::with_options(list(arrow.skip_nul = TRUE), {
     expect_warning(
       expect_identical(
         as.vector(array_with_nul),
         c("person", "woman", "man", "fan", "camera", "tv")
       ),
       "Stripping '\\0' (nul) from character vector",
       fixed = TRUE
     )
   })
 })

 test_that("Array$create() should have helpful error", {
   expect_error(Array$create(list(numeric(0)), list_of(bool())), "Expecting a logical vector")

   lgl <- logical(0)
   int <- integer(0)
   num <- numeric(0)
   char <- character(0)
   expect_error(Array$create(list()), "Requires at least one element to infer")
   expect_error(Array$create(list(lgl, lgl, int)), "Expecting a logical vector")
   expect_error(Array$create(list(char, num, char)), "Expecting a character vector")
 })

 test_that("Array$View() (ARROW-6542)", {
   a <- Array$create(1:3)
   b <- a$View(float32())
   expect_equal(b$type, float32())
   expect_equal(length(b), 3L)

   # Input validation
   expect_error(a$View("not a type"), "type must be a DataType, not character")
 })

 test_that("Array$Validate()", {
   a <- Array$create(1:10)
   expect_error(a$Validate(), NA)
 })

 test_that("is.Array", {
   a <- Array$create(1, type = int32())
   expect_true(is.Array(a))
   expect_true(is.Array(a, "int32"))
   expect_true(is.Array(a, c("int32", "int16")))
   expect_false(is.Array(a, "utf8"))
   expect_true(is.Array(a$View(float32())), "float32")
   expect_false(is.Array(1))
   expect_true(is.Array(ChunkedArray$create(1, 2)))
 })

 test_that("Array$Take()", {
   a <- Array$create(10:20)
   expect_equal(as.vector(a$Take(c(4, 2))), c(14, 12))
 })

 test_that("[ method on Array", {
   vec <- 11:20
   a <- Array$create(vec)
   expect_vector(a[5:9], vec[5:9])
   expect_vector(a[c(9, 3, 5)], vec[c(9, 3, 5)])
   expect_vector(a[rep(c(TRUE, FALSE), 5)], vec[c(1, 3, 5, 7, 9)])
   expect_vector(a[rep(c(TRUE, FALSE, NA, FALSE, TRUE), 2)], c(11, NA, 15, 16, NA, 20))
   expect_vector(a[-4], vec[-4])
   expect_vector(a[-1], vec[-1])
 })

 test_that("[ accepts Arrays and otherwise handles bad input", {
   vec <- 11:20
   a <- Array$create(vec)
   ind <- c(9, 3, 5)
   expect_error(
     a[Array$create(ind)],
     "Cannot extract rows with an Array of type double"
   )
   expect_vector(a[Array$create(ind - 1, type = int8())], vec[ind])
   expect_vector(a[Array$create(ind - 1, type = uint8())], vec[ind])
   expect_vector(a[ChunkedArray$create(8, 2, 4, type = uint8())], vec[ind])

   filt <- seq_along(vec) %in% ind
   expect_vector(a[Array$create(filt)], vec[filt])

   expect_error(
     a["string"],
     "Cannot extract rows with an object of class character"
   )
 })

 test_that("%in% works on dictionary arrays", {
   a1 <- Array$create(as.factor(c("A", "B", "C")))
   a2 <- DictionaryArray$create(c(0L, 1L, 2L), c(4.5, 3.2, 1.1))
   c1 <- Array$create(c(FALSE, TRUE, FALSE))
   c2 <- Array$create(c(FALSE, FALSE, FALSE))
   b1 <- Array$create("B")
   b2 <- Array$create(5.4)

   expect_equal(is_in(a1, b1), c1)
   expect_equal(is_in(a2, b2), c2)
   expect_error(is_in(a1, b2))
 })

 test_that("[ accepts Expressions", {
   vec <- 11:20
   a <- Array$create(vec)
   b <- Array$create(1:10)
   expect_vector(a[b > 4], vec[5:10])
 })

 test_that("Array head/tail", {
   vec <- 11:20
   a <- Array$create(vec)
   expect_vector(head(a), head(vec))
   expect_vector(head(a, 4), head(vec, 4))
   expect_vector(head(a, 40), head(vec, 40))
   expect_vector(head(a, -4), head(vec, -4))
   expect_vector(head(a, -40), head(vec, -40))
   expect_vector(tail(a), tail(vec))
   expect_vector(tail(a, 4), tail(vec, 4))
   expect_vector(tail(a, 40), tail(vec, 40))
   expect_vector(tail(a, -40), tail(vec, -40))
 })

 test_that("Dictionary array: create from arrays, not factor", {
   a <- DictionaryArray$create(c(2L, 1L, 1L, 2L, 0L), c(4.5, 3.2, 1.1))
   expect_equal(a$type, dictionary(int32(), float64()))
 })

 test_that("Dictionary array: translate to R when dict isn't string", {
   a <- DictionaryArray$create(c(2L, 1L, 1L, 2L, 0L), c(4.5, 3.2, 1.1))
   expect_warning(
     expect_identical(
       as.vector(a),
       factor(c(3, 2, 2, 3, 1), labels = c("4.5", "3.2", "1.1"))
     )
   )
 })

 test_that("Array$Equals", {
   vec <- 11:20
   a <- Array$create(vec)
   b <- Array$create(vec)
   d <- Array$create(3:4)
   expect_equal(a, b)
   expect_true(a$Equals(b))
   expect_false(a$Equals(vec))
   expect_false(a$Equals(d))
 })

 test_that("Array$ApproxEquals", {
   vec <- c(1.0000000000001, 2.400000000000001)
   a <- Array$create(vec)
   b <- Array$create(round(vec, 1))
   expect_false(a$Equals(b))
   expect_true(a$ApproxEquals(b))
   expect_false(a$ApproxEquals(vec))
 })

 test_that("auto int64 conversion to int can be disabled (ARROW-10093)", {
   withr::with_options(list(arrow.int64_downcast = FALSE), {
     a <- Array$create(1:10, int64())
     expect_true(inherits(a$as_vector(), "integer64"))

     batch <- RecordBatch$create(x = a)
     expect_true(inherits(as.data.frame(batch)$x, "integer64"))

     tab <- Table$create(x = a)
     expect_true(inherits(as.data.frame(batch)$x, "integer64"))
   })
 })