| /** |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #ifndef TYPE_IMPL_HH |
| #define TYPE_IMPL_HH |
| |
| #include "orc/Type.hh" |
| |
| #include "Adaptor.hh" |
| #include "wrap/orc-proto-wrapper.hh" |
| |
| #include <vector> |
| |
| namespace orc { |
| |
| class TypeImpl: public Type { |
| private: |
| TypeImpl* parent; |
| mutable int64_t columnId; |
| mutable int64_t maximumColumnId; |
| TypeKind kind; |
| std::vector<std::unique_ptr<Type>> subTypes; |
| std::vector<std::string> fieldNames; |
| uint64_t subtypeCount; |
| uint64_t maxLength; |
| uint64_t precision; |
| uint64_t scale; |
| |
| public: |
| /** |
| * Create most of the primitive types. |
| */ |
| TypeImpl(TypeKind kind); |
| |
| /** |
| * Create char and varchar type. |
| */ |
| TypeImpl(TypeKind kind, uint64_t maxLength); |
| |
| /** |
| * Create decimal type. |
| */ |
| TypeImpl(TypeKind kind, uint64_t precision, |
| uint64_t scale); |
| |
| uint64_t getColumnId() const override; |
| |
| uint64_t getMaximumColumnId() const override; |
| |
| TypeKind getKind() const override; |
| |
| uint64_t getSubtypeCount() const override; |
| |
| const Type* getSubtype(uint64_t i) const override; |
| |
| const std::string& getFieldName(uint64_t i) const override; |
| |
| uint64_t getMaximumLength() const override; |
| |
| uint64_t getPrecision() const override; |
| |
| uint64_t getScale() const override; |
| |
| std::string toString() const override; |
| |
| Type* addStructField(const std::string& fieldName, |
| std::unique_ptr<Type> fieldType) override; |
| Type* addUnionChild(std::unique_ptr<Type> fieldType) override; |
| |
| std::unique_ptr<ColumnVectorBatch> createRowBatch(uint64_t size, |
| MemoryPool& memoryPool, |
| bool encoded = false |
| ) const override; |
| |
| /** |
| * Explicitly set the column ids. Only for internal usage. |
| */ |
| void setIds(uint64_t columnId, uint64_t maxColumnId); |
| |
| /** |
| * Add a child type. |
| */ |
| void addChildType(std::unique_ptr<Type> childType); |
| |
| static std::vector<std::pair<std::string, std::unique_ptr<Type> > > parseType( |
| const std::string &input, |
| size_t start, |
| size_t end); |
| |
| private: |
| /** |
| * Assign ids to this node and its children giving this |
| * node rootId. |
| * @param rootId the column id that should be assigned to this node. |
| */ |
| uint64_t assignIds(uint64_t rootId) const; |
| |
| /** |
| * Ensure that ids are assigned to all of the nodes. |
| */ |
| void ensureIdAssigned() const; |
| |
| /** |
| * Parse array type from string |
| * @param input the input string of an array type |
| * @param start start position of the input string |
| * @param end end position of the input string |
| */ |
| static std::unique_ptr<Type> parseArrayType(const std::string &input, |
| size_t start, |
| size_t end); |
| |
| /** |
| * Parse map type from string |
| * @param input the input string of a map type |
| * @param start start position of the input string |
| * @param end end position of the input string |
| */ |
| static std::unique_ptr<Type> parseMapType(const std::string &input, |
| size_t start, |
| size_t end); |
| |
| /** |
| * Parse struct type from string |
| * @param input the input string of a struct type |
| * @param start start position of the input string |
| * @param end end position of the input string |
| */ |
| static std::unique_ptr<Type> parseStructType(const std::string &input, |
| size_t start, |
| size_t end); |
| |
| /** |
| * Parse union type from string |
| * @param input the input string of an union type |
| * @param start start position of the input string |
| * @param end end position of the input string |
| */ |
| static std::unique_ptr<Type> parseUnionType(const std::string &input, |
| size_t start, |
| size_t end); |
| |
| /** |
| * Parse decimal type from string |
| * @param input the input string of a decimal type |
| * @param start start position of the input string |
| * @param end end position of the input string |
| */ |
| static std::unique_ptr<Type> parseDecimalType(const std::string &input, |
| size_t start, |
| size_t end); |
| |
| /** |
| * Parse type for a category |
| * @param category type name |
| * @param input the input string of the category |
| * @param start start position of the input string |
| * @param end end position of the input string |
| */ |
| static std::unique_ptr<Type> parseCategory(std::string category, |
| const std::string &input, |
| size_t start, |
| size_t end); |
| }; |
| |
| std::unique_ptr<Type> convertType(const proto::Type& type, |
| const proto::Footer& footer); |
| |
| /** |
| * Build a clone of the file type, projecting columns from the selected |
| * vector. This routine assumes that the parent of any selected column |
| * is also selected. |
| * @param fileType the type in the file |
| * @param selected is each column by id selected |
| * @return a clone of the fileType filtered by the selection array |
| */ |
| std::unique_ptr<Type> buildSelectedType(const Type *fileType, |
| const std::vector<bool>& selected); |
| } |
| |
| #endif |