blob: dadf15e815cc8edb5f4bffe1a05900fab780797d [file] [log] [blame]
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
#' @title RecordBatchReader classes
#' @description `RecordBatchFileReader` and `RecordBatchStreamReader` are
#' interfaces for generating record batches from different input sources.
#' @usage NULL
#' @format NULL
#' @docType class
#' @section Factory:
#'
#' The `RecordBatchFileReader$create()` and `RecordBatchStreamReader$create()`
#' factory methods instantiate the object and
#' take a single argument, named according to the class:
#'
#' - `file` A character file name, raw vector, or Arrow file connection object
#' (e.g. `RandomAccessFile`).
#' - `stream` A raw vector, [Buffer], or `InputStream`.
#'
#' @section Methods:
#'
#' - `$read_next_batch()`: Returns a `RecordBatch`
#' - `$schema`: Returns a [Schema] (active binding; access without parentheses)
#' - `$batches()`: Returns a list of `RecordBatch`es
#' - `$get_batch(i)`: For `RecordBatchFileReader`, return a particular batch
#' by an integer index.
#' - `$num_record_batches`: For `RecordBatchFileReader`, the number of record
#' batches in the file (active binding; access without parentheses).
#'
#' @rdname RecordBatchReader
#' @name RecordBatchReader
#' @include arrow-package.R
RecordBatchReader <- R6Class(
  "RecordBatchReader",
  inherit = Object,
  public = list(
    # Call the ReadNext binding on this reader and wrap the pointer it
    # returns as a `RecordBatch`.
    read_next_batch = function() {
      batch_ptr <- RecordBatchReader__ReadNext(self)
      shared_ptr(RecordBatch, batch_ptr)
    }
  ),
  active = list(
    # Active binding: accessed as `reader$schema`, without parentheses.
    # Wraps the pointer returned by the schema binding as a `Schema`.
    schema = function() {
      schema_ptr <- RecordBatchReader__schema(self)
      shared_ptr(Schema, schema_ptr)
    }
  )
)
#' @rdname RecordBatchReader
#' @usage NULL
#' @format NULL
#' @export
RecordBatchStreamReader <- R6Class(
  "RecordBatchStreamReader",
  inherit = RecordBatchReader,
  public = list(
    # Wrap each pointer returned by the stream reader's `batches` binding as
    # a `RecordBatch`; the result has one entry per returned pointer.
    batches = function() {
      batch_ptrs <- ipc___RecordBatchStreamReader__batches(self)
      map(batch_ptrs, function(ptr) shared_ptr(ptr, class = RecordBatch))
    }
  )
)
# Factory for RecordBatchStreamReader.
#
# `stream` may be a raw vector or a Buffer, in which case it is first wrapped
# with BufferReader$create(); whatever results must then pass the
# "InputStream" assertion before the stream reader is opened on it.
RecordBatchStreamReader$create <- function(stream) {
  needs_wrapping <- inherits(stream, "raw") || inherits(stream, "Buffer")
  if (needs_wrapping) {
    stream <- BufferReader$create(stream)
  }
  assert_is(stream, "InputStream")

  reader_ptr <- ipc___RecordBatchStreamReader__Open(stream)
  shared_ptr(RecordBatchStreamReader, reader_ptr)
}
#' @rdname RecordBatchReader
#' @usage NULL
#' @format NULL
#' @export
RecordBatchFileReader <- R6Class(
  "RecordBatchFileReader",
  # Open question carried over from the original author: why doesn't this
  # inherit from RecordBatchReader?
  inherit = Object,
  public = list(
    # Read the batch identified by `i` and wrap it as a `RecordBatch`.
    # NOTE(review): `i` is forwarded unchanged to the binding -- confirm
    # whether it expects a 0-based or 1-based index.
    get_batch = function(i) {
      batch_ptr <- ipc___RecordBatchFileReader__ReadRecordBatch(self, i)
      shared_ptr(RecordBatch, batch_ptr)
    },
    # Wrap each pointer returned by the file reader's `batches` binding as
    # a `RecordBatch`; the result has one entry per returned pointer.
    batches = function() {
      batch_ptrs <- ipc___RecordBatchFileReader__batches(self)
      map(batch_ptrs, function(ptr) shared_ptr(ptr, class = RecordBatch))
    }
  ),
  active = list(
    # Active binding: accessed as `reader$num_record_batches`, without
    # parentheses. Returns the binding's result as-is.
    num_record_batches = function() {
      ipc___RecordBatchFileReader__num_record_batches(self)
    },
    # Active binding: accessed as `reader$schema`, without parentheses.
    # Wraps the pointer returned by the schema binding as a `Schema`.
    schema = function() {
      schema_ptr <- ipc___RecordBatchFileReader__schema(self)
      shared_ptr(Schema, schema_ptr)
    }
  )
)
# Factory for RecordBatchFileReader.
#
# `file` is passed through make_readable_file() and the file reader is then
# opened on the result.
RecordBatchFileReader$create <- function(file) {
  readable <- make_readable_file(file)
  reader_ptr <- ipc___RecordBatchFileReader__Open(readable)
  shared_ptr(RecordBatchFileReader, reader_ptr)
}