blob: c505ce7faf199de4d668246cdcf4e2dde6d5a7dd [file]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
#pragma once
#include <cassert>
#include <cstdint>
#include <memory>
#include <string_view>
#include <vector>
#include "paimon/common/data/binary_section.h"
#include "paimon/common/data/binary_string.h"
#include "paimon/common/data/internal_array.h"
#include "paimon/common/data/internal_map.h"
#include "paimon/common/data/internal_row.h"
#include "paimon/common/memory/memory_segment_utils.h"
#include "paimon/data/decimal.h"
#include "paimon/data/timestamp.h"
#include "paimon/memory/bytes.h"
#include "paimon/memory/memory_pool.h"
#include "paimon/result.h"
#include "paimon/status.h"
namespace paimon {
class MemorySegment;
/// A binary implementation of `InternalArray` which is backed by a single `MemorySegment`.
/// For fields that hold fixed-length primitive types, such as long, double or int, they are
/// stored compacted in bytes, just like the original C array.
///
/// @note: Unlike the Java implementation where data may span multiple MemorySegments,
/// in this C++ implementation all data resides within a single MemorySegment.
///
/// The binary layout of BinaryArray:
/// [size(int)] + [null bits(4-byte word boundaries)] + [values or offset&length] + [variable length
/// part].
class BinaryArray final : public BinarySection, public InternalArray {
public:
BinaryArray() = default;
static int32_t CalculateHeaderInBytes(int32_t num_fields);
int32_t Size() const override {
return size_;
}
void PointTo(const MemorySegment& segment, int32_t offset, int32_t size_in_bytes) override;
bool IsNullAt(int32_t pos) const override;
bool GetBoolean(int32_t pos) const override;
char GetByte(int32_t pos) const override;
int16_t GetShort(int32_t pos) const override;
int32_t GetInt(int32_t pos) const override;
int32_t GetDate(int32_t pos) const override;
int64_t GetLong(int32_t pos) const override;
float GetFloat(int32_t pos) const override;
double GetDouble(int32_t pos) const override;
BinaryString GetString(int32_t pos) const override;
std::string_view GetStringView(int32_t pos) const override;
Decimal GetDecimal(int32_t pos, int32_t precision, int32_t scale) const override;
Timestamp GetTimestamp(int32_t pos, int32_t precision) const override;
std::shared_ptr<Bytes> GetBinary(int32_t pos) const override;
std::shared_ptr<InternalArray> GetArray(int32_t pos) const override;
std::shared_ptr<InternalMap> GetMap(int32_t pos) const override;
std::shared_ptr<InternalRow> GetRow(int32_t pos, int32_t num_fields) const override;
bool AnyNull() const;
Result<std::vector<char>> ToBooleanArray() const override;
Result<std::vector<char>> ToByteArray() const override;
Result<std::vector<int16_t>> ToShortArray() const override;
Result<std::vector<int32_t>> ToIntArray() const override;
Result<std::vector<int64_t>> ToLongArray() const override;
Result<std::vector<float>> ToFloatArray() const override;
Result<std::vector<double>> ToDoubleArray() const override;
BinaryArray Copy(MemoryPool* pool) const;
void Copy(BinaryArray* reuse, MemoryPool* pool) const;
int32_t HashCode() const override {
return MemorySegmentUtils::HashByWords({segment_}, offset_, size_in_bytes_,
GetDefaultPool().get());
}
static BinaryArray FromIntArray(const std::vector<int32_t>& arr, MemoryPool* pool);
static BinaryArray FromLongArray(const std::vector<int64_t>& arr, MemoryPool* pool);
static BinaryArray FromLongArray(const InternalArray* arr, MemoryPool* pool);
private:
void AssertIndexIsValid(int32_t ordinal) const;
int32_t GetElementOffset(int32_t ordinal, int32_t element_size) const;
Status CheckNoNull() const {
if (AnyNull()) {
return Status::Invalid("Primitive array must not contain a null value.");
}
return Status::OK();
}
private:
/// The number of elements in this array.
int32_t size_ = 0;
/// The position to start storing array elements.
int32_t element_offset_ = -1;
};
} // namespace paimon