| // Licensed to the Apache Software Foundation (ASF) under one or more |
| // contributor license agreements. See the NOTICE file distributed with |
| // this work for additional information regarding copyright ownership. |
| // The ASF licenses this file to You under the Apache License, Version 2.0 |
| // (the "License"); you may not use this file except in compliance with |
| // the License. You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| using System; |
| using System.Collections.Generic; |
| using System.Linq; |
| using Apache.Arrow.Memory; |
| using Apache.Arrow.Types; |
| |
| namespace Apache.Arrow |
| { |
| public sealed class ArrayData : IDisposable |
| { |
| private const int RecalculateNullCount = -1; |
| |
| public readonly IArrowType DataType; |
| public readonly int Length; |
| |
| /// <summary> |
| /// The number of null values in the Array. May be -1 if the null count has not been computed. |
| /// </summary> |
| public int NullCount; |
| |
| public readonly int Offset; |
| public readonly ArrowBuffer[] Buffers; |
| public readonly ArrayData[] Children; |
| public readonly ArrayData Dictionary; // Only used for dictionary type |
| |
| /// <summary> |
| /// Get the number of null values in the Array, computing the count if required. |
| /// </summary> |
| public int GetNullCount() |
| { |
| if (NullCount == RecalculateNullCount) |
| { |
| NullCount = ComputeNullCount(); |
| } |
| |
| return NullCount; |
| } |
| |
| // This is left for compatibility with lower version binaries |
| // before the dictionary type was supported. |
| public ArrayData( |
| IArrowType dataType, |
| int length, int nullCount, int offset, |
| IEnumerable<ArrowBuffer> buffers, IEnumerable<ArrayData> children) : |
| this(dataType, length, nullCount, offset, buffers, children, null) |
| { } |
| |
| // This is left for compatibility with lower version binaries |
| // before the dictionary type was supported. |
| public ArrayData( |
| IArrowType dataType, |
| int length, int nullCount, int offset, |
| ArrowBuffer[] buffers, ArrayData[] children) : |
| this(dataType, length, nullCount, offset, buffers, children, null) |
| { } |
| |
| public ArrayData( |
| IArrowType dataType, |
| int length, int nullCount = 0, int offset = 0, |
| IEnumerable<ArrowBuffer> buffers = null, IEnumerable<ArrayData> children = null, ArrayData dictionary = null) |
| { |
| DataType = dataType ?? NullType.Default; |
| Length = length; |
| NullCount = nullCount; |
| Offset = offset; |
| Buffers = buffers?.ToArray(); |
| Children = children?.ToArray(); |
| Dictionary = dictionary; |
| } |
| |
| public ArrayData( |
| IArrowType dataType, |
| int length, int nullCount = 0, int offset = 0, |
| ArrowBuffer[] buffers = null, ArrayData[] children = null, ArrayData dictionary = null) |
| { |
| DataType = dataType ?? NullType.Default; |
| Length = length; |
| NullCount = nullCount; |
| Offset = offset; |
| Buffers = buffers; |
| Children = children; |
| Dictionary = dictionary; |
| } |
| |
| public void Dispose() |
| { |
| if (Buffers != null) |
| { |
| foreach (ArrowBuffer buffer in Buffers) |
| { |
| buffer.Dispose(); |
| } |
| } |
| |
| if (Children != null) |
| { |
| foreach (ArrayData child in Children) |
| { |
| child?.Dispose(); |
| } |
| } |
| |
| Dictionary?.Dispose(); |
| } |
| |
| public ArrayData Slice(int offset, int length) |
| { |
| if (offset > Length) |
| { |
| throw new ArgumentException($"Offset {offset} cannot be greater than Length {Length} for Array.Slice"); |
| } |
| |
| length = Math.Min(Length - offset, length); |
| offset += Offset; |
| |
| int nullCount; |
| if (NullCount == 0) |
| { |
| nullCount = 0; |
| } |
| else if (NullCount == Length) |
| { |
| nullCount = length; |
| } |
| else if (offset == Offset && length == Length) |
| { |
| nullCount = NullCount; |
| } |
| else |
| { |
| nullCount = RecalculateNullCount; |
| } |
| |
| return new ArrayData(DataType, length, nullCount, offset, Buffers, Children, Dictionary); |
| } |
| |
| public ArrayData Clone(MemoryAllocator allocator = default) |
| { |
| return new ArrayData( |
| DataType, |
| Length, |
| NullCount, |
| Offset, |
| Buffers?.Select(b => b.Clone(allocator))?.ToArray(), |
| Children?.Select(b => b.Clone(allocator))?.ToArray(), |
| Dictionary?.Clone(allocator)); |
| } |
| |
| private int ComputeNullCount() |
| { |
| if (DataType.TypeId == ArrowTypeId.Union) |
| { |
| return UnionArray.ComputeNullCount(this); |
| } |
| |
| if (Buffers == null || Buffers.Length == 0 || Buffers[0].IsEmpty) |
| { |
| return 0; |
| } |
| |
| // Note: Dictionary arrays may be logically null if there is a null in the dictionary values, |
| // but this isn't accounted for by the IArrowArray.IsNull implementation, |
| // so we maintain consistency with that behaviour here. |
| |
| return Length - BitUtility.CountBits(Buffers[0].Span, Offset, Length); |
| } |
| } |
| } |