// be/src/util/min-max-filter.cc - impala - Git at Google

 // Licensed to the Apache Software Foundation (ASF) under one
 // or more contributor license agreements.  See the NOTICE file
 // distributed with this work for additional information
 // regarding copyright ownership.  The ASF licenses this file
 // to you under the Apache License, Version 2.0 (the
 // "License"); you may not use this file except in compliance
 // with the License.  You may obtain a copy of the License at
 //
 //   http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing,
 // software distributed under the License is distributed on an
 // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, either express or implied.  See the License for the
 // specific language governing permissions and limitations
 // under the License.

 #include "util/min-max-filter.h"

 #include <sstream>
 #include <unordered_map>

 #include "common/object-pool.h"
 #include "runtime/date-value.h"
 #include "runtime/decimal-value.inline.h"
 #include "runtime/raw-value.h"
 #include "runtime/string-value.inline.h"
 #include "runtime/timestamp-value.inline.h"

 using std::numeric_limits;
 using std::stringstream;

 namespace impala {

 // Lookup table keyed by PrimitiveType: maps the type of the filtered column to the
 // LLVM_CLASS_NAME string of the matching filter class. Read by
 // MinMaxFilter::GetLlvmClassName().
 static std::unordered_map<int, string> MIN_MAX_FILTER_LLVM_CLASS_NAMES{
     // Boolean and integer filters.
     {PrimitiveType::TYPE_BOOLEAN, BoolMinMaxFilter::LLVM_CLASS_NAME},
     {PrimitiveType::TYPE_TINYINT, TinyIntMinMaxFilter::LLVM_CLASS_NAME},
     {PrimitiveType::TYPE_SMALLINT, SmallIntMinMaxFilter::LLVM_CLASS_NAME},
     {PrimitiveType::TYPE_INT, IntMinMaxFilter::LLVM_CLASS_NAME},
     {PrimitiveType::TYPE_BIGINT, BigIntMinMaxFilter::LLVM_CLASS_NAME},
     // Floating point filters.
     {PrimitiveType::TYPE_FLOAT, FloatMinMaxFilter::LLVM_CLASS_NAME},
     {PrimitiveType::TYPE_DOUBLE, DoubleMinMaxFilter::LLVM_CLASS_NAME},
     // String, date/time and decimal filters.
     {PrimitiveType::TYPE_STRING, StringMinMaxFilter::LLVM_CLASS_NAME},
     {PrimitiveType::TYPE_TIMESTAMP, TimestampMinMaxFilter::LLVM_CLASS_NAME},
     {PrimitiveType::TYPE_DATE, DateMinMaxFilter::LLVM_CLASS_NAME},
     {PrimitiveType::TYPE_DECIMAL, DecimalMinMaxFilter::LLVM_CLASS_NAME},
 };

 // Lookup table keyed by PrimitiveType: maps a non-decimal column type to the
 // IRFunction::Type of its *_MIN_MAX_FILTER_INSERT function. Decimal columns are not
 // listed here; MinMaxFilter::GetInsertIRFunctionType() resolves them through
 // DECIMAL_MIN_MAX_FILTER_IR_FUNCTION_INSERT_TYPES.
 static std::unordered_map<int, IRFunction::Type>
     MIN_MAX_FILTER_IR_FUNCTION_INSERT_TYPES{
         // Boolean and integer filters.
         {PrimitiveType::TYPE_BOOLEAN, IRFunction::BOOL_MIN_MAX_FILTER_INSERT},
         {PrimitiveType::TYPE_TINYINT, IRFunction::TINYINT_MIN_MAX_FILTER_INSERT},
         {PrimitiveType::TYPE_SMALLINT, IRFunction::SMALLINT_MIN_MAX_FILTER_INSERT},
         {PrimitiveType::TYPE_INT, IRFunction::INT_MIN_MAX_FILTER_INSERT},
         {PrimitiveType::TYPE_BIGINT, IRFunction::BIGINT_MIN_MAX_FILTER_INSERT},
         // Floating point filters.
         {PrimitiveType::TYPE_FLOAT, IRFunction::FLOAT_MIN_MAX_FILTER_INSERT},
         {PrimitiveType::TYPE_DOUBLE, IRFunction::DOUBLE_MIN_MAX_FILTER_INSERT},
         // String and date/time filters.
         {PrimitiveType::TYPE_STRING, IRFunction::STRING_MIN_MAX_FILTER_INSERT},
         {PrimitiveType::TYPE_TIMESTAMP, IRFunction::TIMESTAMP_MIN_MAX_FILTER_INSERT},
         {PrimitiveType::TYPE_DATE, IRFunction::DATE_MIN_MAX_FILTER_INSERT},
     };

 // Lookup table for decimal columns, keyed by the value that
 // ColumnType::GetDecimalByteSize() returns for the column's precision: maps that size to
 // the IRFunction::Type of the matching DECIMAL_MIN_MAX_FILTER_INSERT* function.
 static std::unordered_map<int, IRFunction::Type>
     DECIMAL_MIN_MAX_FILTER_IR_FUNCTION_INSERT_TYPES{
         {DECIMAL_SIZE_4BYTE, IRFunction::DECIMAL_MIN_MAX_FILTER_INSERT4},
         {DECIMAL_SIZE_8BYTE, IRFunction::DECIMAL_MIN_MAX_FILTER_INSERT8},
         {DECIMAL_SIZE_16BYTE, IRFunction::DECIMAL_MIN_MAX_FILTER_INSERT16},
     };

 // Lookup table keyed by PrimitiveType: maps a column type to the IRFunction::Type of its
 // *_MIN_MAX_FILTER_ALWAYSTRUE function. Unlike the insert table, decimals have a single
 // entry here. Read by MinMaxFilter::GetAlwaysTrueIRFunctionType().
 static std::unordered_map<int, IRFunction::Type>
     MIN_MAX_FILTER_IR_FUNCTION_ALWAYSTRUE_TYPES{
         // Boolean and integer filters.
         {PrimitiveType::TYPE_BOOLEAN, IRFunction::BOOL_MIN_MAX_FILTER_ALWAYSTRUE},
         {PrimitiveType::TYPE_TINYINT, IRFunction::TINYINT_MIN_MAX_FILTER_ALWAYSTRUE},
         {PrimitiveType::TYPE_SMALLINT, IRFunction::SMALLINT_MIN_MAX_FILTER_ALWAYSTRUE},
         {PrimitiveType::TYPE_INT, IRFunction::INT_MIN_MAX_FILTER_ALWAYSTRUE},
         {PrimitiveType::TYPE_BIGINT, IRFunction::BIGINT_MIN_MAX_FILTER_ALWAYSTRUE},
         // Floating point filters.
         {PrimitiveType::TYPE_FLOAT, IRFunction::FLOAT_MIN_MAX_FILTER_ALWAYSTRUE},
         {PrimitiveType::TYPE_DOUBLE, IRFunction::DOUBLE_MIN_MAX_FILTER_ALWAYSTRUE},
         // String, date/time and decimal filters.
         {PrimitiveType::TYPE_STRING, IRFunction::STRING_MIN_MAX_FILTER_ALWAYSTRUE},
         {PrimitiveType::TYPE_TIMESTAMP, IRFunction::TIMESTAMP_MIN_MAX_FILTER_ALWAYSTRUE},
         {PrimitiveType::TYPE_DATE, IRFunction::DATE_MIN_MAX_FILTER_ALWAYSTRUE},
         {PrimitiveType::TYPE_DECIMAL, IRFunction::DECIMAL_MIN_MAX_FILTER_ALWAYSTRUE},
     };

 // Returns the LLVM class name registered for 'type' in MIN_MAX_FILTER_LLVM_CLASS_NAMES.
 // 'type' is expected to have an entry in that table; a miss trips the DCHECK below.
 string MinMaxFilter::GetLlvmClassName(PrimitiveType type) {
   const auto entry = MIN_MAX_FILTER_LLVM_CLASS_NAMES.find(type);
   const bool known_type = entry != MIN_MAX_FILTER_LLVM_CLASS_NAMES.end();
   DCHECK(known_type) << "Not a valid type: " << type;
   return entry->second;
 }

 // Returns the IRFunction::Type of the Insert() function for a filter on 'column_type'.
 // Decimal columns are looked up by the byte size derived from their precision; every
 // other type is looked up directly by its primitive type. A type or precision without a
 // table entry trips the corresponding DCHECK.
 IRFunction::Type MinMaxFilter::GetInsertIRFunctionType(ColumnType column_type) {
   if (column_type.type == PrimitiveType::TYPE_DECIMAL) {
     const auto decimal_entry = DECIMAL_MIN_MAX_FILTER_IR_FUNCTION_INSERT_TYPES.find(
         ColumnType::GetDecimalByteSize(column_type.precision));
     DCHECK(decimal_entry != DECIMAL_MIN_MAX_FILTER_IR_FUNCTION_INSERT_TYPES.end())
         << "Not a valid precision: " << column_type.precision;
     return decimal_entry->second;
   }

   const auto entry = MIN_MAX_FILTER_IR_FUNCTION_INSERT_TYPES.find(column_type.type);
   DCHECK(entry != MIN_MAX_FILTER_IR_FUNCTION_INSERT_TYPES.end())
       << "Not a valid type: " << column_type.type;
   return entry->second;
 }

 // Returns the IRFunction::Type of the AlwaysTrue() function for a filter on
 // 'column_type', as registered in MIN_MAX_FILTER_IR_FUNCTION_ALWAYSTRUE_TYPES. A type
 // without a table entry trips the DCHECK below.
 IRFunction::Type MinMaxFilter::GetAlwaysTrueIRFunctionType(ColumnType column_type) {
   const auto entry = MIN_MAX_FILTER_IR_FUNCTION_ALWAYSTRUE_TYPES.find(column_type.type);
   const bool known_type = entry != MIN_MAX_FILTER_IR_FUNCTION_ALWAYSTRUE_TYPES.end();
   DCHECK(known_type) << "Not a valid type: " << column_type.type;
   return entry->second;
 }

 // LLVM class name string for MinMaxFilter itself (the per-type filters define their own
 // LLVM_CLASS_NAME further down in this file).
 const char* MinMaxFilter::LLVM_CLASS_NAME = "class.impala::MinMaxFilter";

 // Reads the integer that 'value' points to, interpreting it according to the integer
 // primitive type in 'type' (TINYINT, SMALLINT, INT or BIGINT), and returns it widened to
 // int64_t. Any other type trips a DCHECK and yields -1.
 int64_t GetIntTypeValue(const ColumnType& type, const void* value) {
   int64_t widened = -1;
   switch (type.type) {
     case TYPE_TINYINT:
       widened = *static_cast<const int8_t*>(value);
       break;
     case TYPE_SMALLINT:
       widened = *static_cast<const int16_t*>(value);
       break;
     case TYPE_INT:
       widened = *static_cast<const int32_t*>(value);
       break;
     case TYPE_BIGINT:
       widened = *static_cast<const int64_t*>(value);
       break;
     default:
       DCHECK(false) << "Not an int type: " << type;
       break;
   }
   return widened;
 }

 // Defines the members that all numeric min-max filters have in common.
 //   NAME            class-name prefix; the class is NAME##MinMaxFilter
 //   TYPE            C++ type whose numeric_limits give the always-false bounds
 //   PROTOBUF_TYPE   prefix of the <PROTOBUF_TYPE>_val accessors on the protobuf min/max
 //   PRIMITIVE_TYPE  suffix of the PrimitiveType enumerator returned by type()
 //
 // Generated members:
 //   LLVM_CLASS_NAME  The string "class.impala::<NAME>MinMaxFilter".
 //   constructor      Builds the filter from a MinMaxFilterPB. An always-false protobuf
 //                    produces the inverted range min_ = max(TYPE), max_ = lowest(TYPE);
 //                    an always-true protobuf only sets always_true_; otherwise min_ and
 //                    max_ are read from the protobuf, which must carry both values.
 //   type()           Returns PrimitiveType::TYPE_<PRIMITIVE_TYPE>.
 //   ToProtobuf()     Writes min/max only when the filter is neither always-false nor
 //                    always-true, and always writes both flags.
 //   DebugString()    Human-readable dump of the bounds and both flags.
 //   Or()             Merges 'in' into 'out': an always-false 'out' takes over the bounds
 //                    of 'in'; otherwise, if either side is always-true, 'out' becomes
 //                    always-true; otherwise 'out' gets the smaller min and larger max.
 //   Copy()           Copies min and max from 'in' to 'out' (flags are not touched).
 #define NUMERIC_MIN_MAX_FILTER_FUNCS(NAME, TYPE, PROTOBUF_TYPE, PRIMITIVE_TYPE)        \
   const char* NAME##MinMaxFilter::LLVM_CLASS_NAME =                                    \
       "class.impala::" #NAME "MinMaxFilter";                                           \
   NAME##MinMaxFilter::NAME##MinMaxFilter(const MinMaxFilterPB& protobuf) {             \
     if (protobuf.always_false()) {                                                     \
       min_ = numeric_limits<TYPE>::max();                                              \
       max_ = numeric_limits<TYPE>::lowest();                                           \
     } else if (protobuf.always_true()) {                                               \
       always_true_ = true;                                                             \
     } else {                                                                           \
       DCHECK(protobuf.has_min());                                                      \
       DCHECK(protobuf.has_max());                                                      \
       DCHECK(protobuf.min().has_##PROTOBUF_TYPE##_val());                              \
       DCHECK(protobuf.max().has_##PROTOBUF_TYPE##_val());                              \
       min_ = protobuf.min().PROTOBUF_TYPE##_val();                                     \
       max_ = protobuf.max().PROTOBUF_TYPE##_val();                                     \
     }                                                                                  \
   }                                                                                    \
   PrimitiveType NAME##MinMaxFilter::type() const {                                     \
     return PrimitiveType::TYPE_##PRIMITIVE_TYPE;                                       \
   }                                                                                    \
   void NAME##MinMaxFilter::ToProtobuf(MinMaxFilterPB* protobuf) const {                \
     if (!AlwaysFalse() && !AlwaysTrue()) {                                             \
       protobuf->mutable_min()->set_##PROTOBUF_TYPE##_val(min_);                        \
       protobuf->mutable_max()->set_##PROTOBUF_TYPE##_val(max_);                        \
     }                                                                                  \
     protobuf->set_always_false(AlwaysFalse());                                         \
     protobuf->set_always_true(AlwaysTrue());                                           \
   }                                                                                    \
   string NAME##MinMaxFilter::DebugString() const {                                     \
     stringstream out;                                                                  \
     out << #NAME << "MinMaxFilter(min=" << min_ << ", max=" << max_                    \
         << ", always_false=" << (AlwaysFalse() ? "true" : "false")                     \
         << ", always_true=" << (AlwaysTrue() ? "true" : "false") << ")";               \
     return out.str();                                                                  \
   }                                                                                    \
   void NAME##MinMaxFilter::Or(const MinMaxFilterPB& in, MinMaxFilterPB* out) {         \
     if (out->always_false()) {                                                         \
       /* 'out' has no bounds yet: take those of 'in' in the matching field. */         \
       out->mutable_min()->set_##PROTOBUF_TYPE##_val(in.min().PROTOBUF_TYPE##_val());   \
       out->mutable_max()->set_##PROTOBUF_TYPE##_val(in.max().PROTOBUF_TYPE##_val());   \
       out->set_always_false(false);                                                    \
     } else if (in.always_true() || out->always_true()) {                               \
       out->set_always_true(true);                                                      \
     } else {                                                                           \
       out->mutable_min()->set_##PROTOBUF_TYPE##_val(                                   \
           std::min(in.min().PROTOBUF_TYPE##_val(), out->min().PROTOBUF_TYPE##_val())); \
       out->mutable_max()->set_##PROTOBUF_TYPE##_val(                                   \
           std::max(in.max().PROTOBUF_TYPE##_val(), out->max().PROTOBUF_TYPE##_val())); \
     }                                                                                  \
   }                                                                                    \
   void NAME##MinMaxFilter::Copy(const MinMaxFilterPB& in, MinMaxFilterPB* out) {       \
     out->mutable_min()->set_##PROTOBUF_TYPE##_val(in.min().PROTOBUF_TYPE##_val());     \
     out->mutable_max()->set_##PROTOBUF_TYPE##_val(in.max().PROTOBUF_TYPE##_val());     \
   }

 // Instantiate the common numeric filter members. The arguments are, in order: the
 // class-name prefix, the C++ type used for the always-false bounds, the prefix of the
 // protobuf <x>_val accessors, and the PrimitiveType suffix. Note that Float goes
 // through the 'double' protobuf accessors.
 NUMERIC_MIN_MAX_FILTER_FUNCS(Bool, bool, bool, BOOLEAN);
 NUMERIC_MIN_MAX_FILTER_FUNCS(TinyInt, int8_t, byte, TINYINT);
 NUMERIC_MIN_MAX_FILTER_FUNCS(SmallInt, int16_t, short, SMALLINT);
 NUMERIC_MIN_MAX_FILTER_FUNCS(Int, int32_t, int, INT);
 NUMERIC_MIN_MAX_FILTER_FUNCS(BigInt, int64_t, long, BIGINT);
 NUMERIC_MIN_MAX_FILTER_FUNCS(Float, float, double, FLOAT);
 NUMERIC_MIN_MAX_FILTER_FUNCS(Double, double, double, DOUBLE);

 // Returns the largest value representable by the integer primitive type in 'type'
 // (TINYINT, SMALLINT, INT or BIGINT), widened to int64_t. Any other type trips a DCHECK
 // and yields -1.
 int64_t GetIntTypeMax(const ColumnType& type) {
   int64_t upper_limit = -1;
   switch (type.type) {
     case TYPE_TINYINT:
       upper_limit = numeric_limits<int8_t>::max();
       break;
     case TYPE_SMALLINT:
       upper_limit = numeric_limits<int16_t>::max();
       break;
     case TYPE_INT:
       upper_limit = numeric_limits<int32_t>::max();
       break;
     case TYPE_BIGINT:
       upper_limit = numeric_limits<int64_t>::max();
       break;
     default:
       DCHECK(false) << "Not an int type: " << type;
       break;
   }
   return upper_limit;
 }

 // Returns the smallest value representable by the integer primitive type in 'type'
 // (TINYINT, SMALLINT, INT or BIGINT), widened to int64_t. Any other type trips a DCHECK
 // and yields -1.
 int64_t GetIntTypeMin(const ColumnType& type) {
   int64_t lower_limit = -1;
   switch (type.type) {
     case TYPE_TINYINT:
       lower_limit = numeric_limits<int8_t>::lowest();
       break;
     case TYPE_SMALLINT:
       lower_limit = numeric_limits<int16_t>::lowest();
       break;
     case TYPE_INT:
       lower_limit = numeric_limits<int32_t>::lowest();
       break;
     case TYPE_BIGINT:
       lower_limit = numeric_limits<int64_t>::lowest();
       break;
     default:
       DCHECK(false) << "Not an int type: " << type;
       break;
   }
   return lower_limit;
 }

 // Returns the number of integers in the inclusive range [lo, hi], i.e. hi - lo + 1, as
 // a double. The subtraction is done on the unsigned representation so that it cannot
 // overflow, even for the full int64_t range (where hi - lo + 1 does not fit in int64_t).
 // For hi < lo the result is the same non-positive value that hi - lo + 1 would give.
 static inline double MinMaxFilterRangeWidth(int64_t lo, int64_t hi) {
   if (hi >= lo) {
     return static_cast<double>(static_cast<uint64_t>(hi) - static_cast<uint64_t>(lo))
         + 1.0;
   }
   return 1.0
       - static_cast<double>(static_cast<uint64_t>(lo) - static_cast<uint64_t>(hi));
 }

 // Defines the overlap-related members of the integer min-max filters. NAME is the
 // class-name prefix (the class is NAME##MinMaxFilter) and TYPE is the C++ type that the
 // void* data pointers are reinterpreted as when the column type equals the filter type.
 //
 // Generated members:
 //   GetCastIntMinMax()   Writes the filter's [min_, max_] clamped to the value range of
 //                        'col_type' into out_min/out_max. Returns false when the filter
 //                        range lies entirely outside the range of 'col_type'.
 //   EvalOverlap() (3 args)  Returns true iff [min_, max_] intersects the data range
 //                        [*data_min, *data_max].
 //   EvalOverlap() (5 args)  Same, but for an arbitrary integer column type; also hands
 //                        back the clamped filter bounds through filter_min64 and
 //                        filter_max64.
 //   ComputeOverlapRatio()  Returns the fraction of the data range covered by the
 //                        filter: 0.0 if disjoint, 1.0 if the filter covers the whole
 //                        data range, otherwise the width of the intersection divided by
 //                        the width of the data range. Widths are computed with
 //                        MinMaxFilterRangeWidth() so that wide ranges cannot overflow.
 #define NUMERIC_MIN_MAX_FILTER_CAST(NAME, TYPE)                                        \
   bool NAME##MinMaxFilter::GetCastIntMinMax(                                           \
       const ColumnType& col_type, int64_t* out_min, int64_t* out_max) const {          \
     /* If the primitive type of the filter is the same as the column type, */          \
     /* there is no chance of mis-alignment. */                                         \
     if (LIKELY(type() == col_type.type)) {                                             \
       *out_min = min_;                                                                 \
       *out_max = max_;                                                                 \
       return true;                                                                     \
     }                                                                                  \
     int64_t type_min = GetIntTypeMin(col_type);                                        \
     int64_t type_max = GetIntTypeMax(col_type);                                        \
     if (min_ < type_min) {                                                             \
       *out_min = type_min;                                                             \
     } else if (min_ > type_max) {                                                      \
       return false;                                                                    \
     } else {                                                                           \
       *out_min = min_;                                                                 \
     }                                                                                  \
     if (max_ > type_max) {                                                             \
       *out_max = type_max;                                                             \
     } else if (max_ < type_min) {                                                      \
       return false;                                                                    \
     } else {                                                                           \
       *out_max = max_;                                                                 \
     }                                                                                  \
     return true;                                                                       \
   }                                                                                    \
   bool NAME##MinMaxFilter::EvalOverlap(                                                \
       const ColumnType& col_type, void* data_min, void* data_max) const {              \
     /* Apply an optimization when the column type and the filter type are the same */  \
     if (LIKELY(type() == col_type.type)) {                                             \
       return !(max_ < *reinterpret_cast<TYPE*>(data_min)                               \
           || *reinterpret_cast<TYPE*>(data_max) < min_);                               \
     }                                                                                  \
     int64_t int_min;                                                                   \
     int64_t int_max;                                                                   \
     return EvalOverlap(col_type, data_min, data_max, &int_min, &int_max);              \
   }                                                                                    \
   bool NAME##MinMaxFilter::EvalOverlap(const ColumnType& type, void* data_min,         \
       void* data_max, int64_t* filter_min64, int64_t* filter_max64) const {            \
     if (LIKELY(GetCastIntMinMax(type, filter_min64, filter_max64))) {                  \
       return !(*filter_max64 < GetIntTypeValue(type, data_min)                         \
           || GetIntTypeValue(type, data_max) < *filter_min64);                         \
     }                                                                                  \
     /* If the filter min and max are not within the min and the*/                      \
     /* max of the type, then there is no chance of overlapping.*/                      \
     return false;                                                                      \
   }                                                                                    \
   float NAME##MinMaxFilter::ComputeOverlapRatio(                                       \
       const ColumnType& col_type, void* data_min, void* data_max) {                    \
     /* Apply an optimization when the column type and the filter type are the same */  \
     if (LIKELY(type() == col_type.type)) {                                             \
       if (EvalOverlap(col_type, data_min, data_max)) {                                 \
         /* If the filter completely covers the data range, return 1.0 */               \
         if (min_ <= *reinterpret_cast<TYPE*>(data_min)                                 \
             && *reinterpret_cast<TYPE*>(data_max) <= max_) {                           \
           return 1.0;                                                                  \
         }                                                                              \
         TYPE overlap_min = std::max(*reinterpret_cast<TYPE*>(data_min), min_);         \
         TYPE overlap_max = std::min(*reinterpret_cast<TYPE*>(data_max), max_);         \
         /* Widths are computed overflow-free; see MinMaxFilterRangeWidth(). */         \
         return static_cast<float>(MinMaxFilterRangeWidth(overlap_min, overlap_max)     \
             / MinMaxFilterRangeWidth(*reinterpret_cast<TYPE*>(data_min),               \
                 *reinterpret_cast<TYPE*>(data_max)));                                  \
       } else {                                                                         \
         return 0.0;                                                                    \
       }                                                                                \
     }                                                                                  \
     int64_t filter_min64;                                                              \
     int64_t filter_max64;                                                              \
     if (EvalOverlap(col_type, data_min, data_max, &filter_min64, &filter_max64)) {     \
       int64_t data_min64 = GetIntTypeValue(col_type, data_min);                        \
       int64_t data_max64 = GetIntTypeValue(col_type, data_max);                        \
       /* If the filter completely covers the data range, return 1.0 */                 \
       if (filter_min64 <= data_min64 && data_max64 <= filter_max64) {                  \
         return 1.0;                                                                    \
       }                                                                                \
       int64_t overlap_min = std::max(data_min64, filter_min64);                        \
       int64_t overlap_max = std::min(data_max64, filter_max64);                        \
       return static_cast<float>(MinMaxFilterRangeWidth(overlap_min, overlap_max)       \
           / MinMaxFilterRangeWidth(data_min64, data_max64));                           \
     } else {                                                                           \
       return 0.0;                                                                      \
     }                                                                                  \
   }

 // Generate GetCastIntMinMax(), both EvalOverlap() overloads and the void* flavor of
 // ComputeOverlapRatio() for the integer filters. The second argument is the C++ type
 // that the void* data pointers are reinterpreted as.
 NUMERIC_MIN_MAX_FILTER_CAST(TinyInt, int8_t);
 NUMERIC_MIN_MAX_FILTER_CAST(SmallInt, int16_t);
 NUMERIC_MIN_MAX_FILTER_CAST(Int, int32_t);
 NUMERIC_MIN_MAX_FILTER_CAST(BigInt, int64_t);

 float TinyIntMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, const TColumnValue& data_min, const TColumnValue& data_max) {
   return ComputeOverlapRatio(
       type, (void*)&data_min.byte_val, (void*)&data_max.byte_val);
 }

 float SmallIntMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, const TColumnValue& data_min, const TColumnValue& data_max) {
   return ComputeOverlapRatio(
       type, (void*)&data_min.short_val, (void*)&data_max.short_val);
 }

 float IntMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, const TColumnValue& data_min, const TColumnValue& data_max) {
   return ComputeOverlapRatio(
       type, (void*)&data_min.int_val, (void*)&data_max.int_val);
 }

 float BigIntMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, const TColumnValue& data_min, const TColumnValue& data_max) {
   return ComputeOverlapRatio(
       type, (void*)&data_min.long_val, (void*)&data_max.long_val);
 }

 // Defines NAME##MinMaxFilter::GetCastIntMinMax() for filter types whose bounds cannot be
 // cast to an integer range. The generated function DCHECKs unconditionally and then
 // returns true without writing 'out_min' or 'out_max'. The TYPE argument is not used by
 // the expansion.
 #define NUMERIC_MIN_MAX_FILTER_NO_CAST(NAME, TYPE)                                     \
   bool NAME##MinMaxFilter::GetCastIntMinMax(                                           \
       const ColumnType& type, int64_t* out_min, int64_t* out_max) const {              \
     DCHECK(false) << "Casting min-max filters of type " << #NAME << " not supported."; \
     return true;                                                                       \
   }

 // Returns true iff the filter range [min_, max_] intersects the data range
 // [*data_min, *data_max]. Both pointers are read as bool; 'type' is not consulted.
 bool BoolMinMaxFilter::EvalOverlap(
     const ColumnType& type, void* data_min, void* data_max) const {
   // The ranges intersect when neither one ends before the other one starts.
   return max_ >= *static_cast<bool*>(data_min) && *static_cast<bool*>(data_max) >= min_;
 }

 // Returns 1.0 when the filter range intersects the data range [*data_min, *data_max]
 // and 0.0 otherwise; no partial ratio is computed for Booleans.
 float BoolMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, void* data_min, void* data_max) {
   if (EvalOverlap(type, data_min, data_max)) {
     return 1.0;
   }
   return 0.0;
 }

 // TColumnValue flavor of ComputeOverlapRatio(). Neither argument is examined; the
 // function always returns -1.
 // NOTE(review): -1 presumably signals "not supported for Booleans" - confirm with the
 // callers.
 float BoolMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, const TColumnValue& data_min, const TColumnValue& data_max) {
   const float fixed_result = -1;
   return fixed_result;
 }

 // Defines the overlap-related members of the floating point min-max filters. NAME is
 // the class-name prefix (the class is NAME##MinMaxFilter) and TYPE is the C++ type that
 // the void* data pointers are dereferenced as.
 //
 // Generated members:
 //   EvalOverlap()          Returns true iff [min_, max_] intersects the data range
 //                          [*data_min, *data_max].
 //   ComputeOverlapRatio()  (void* flavor) Returns 0.0 if the ranges are disjoint, 1.0 if
 //                          the filter covers the whole data range, and otherwise
 //                          (overlap_max - overlap_min + 1) / (data_max - data_min + 1).
 //   ComputeOverlapRatio()  (TColumnValue flavor) Converts the double_val members of
 //                          'data_min' and 'data_max' to TYPE and delegates to the void*
 //                          flavor.
 #define APPROXIMATE_NUMERIC_MIN_MAX_FILTER_EVAL_OVERLAP(NAME, TYPE)                 \
   bool NAME##MinMaxFilter::EvalOverlap(                                             \
       const ColumnType& type, void* data_min, void* data_max) const {               \
     return !(max_ < *(TYPE*)data_min || *(TYPE*)data_max < min_);                   \
   }                                                                                 \
   float NAME##MinMaxFilter::ComputeOverlapRatio(                                    \
       const ColumnType& type, void* data_min_ptr, void* data_max_ptr) {             \
     /* No overlap at all: report 0 instead of a negative ratio. */                  \
     if (!EvalOverlap(type, data_min_ptr, data_max_ptr)) return 0.0;                 \
     TYPE data_min = *(TYPE*)data_min_ptr;                                           \
     TYPE data_max = *(TYPE*)data_max_ptr;                                           \
     /* If the filter completely covers the data range, return 1.0 */                \
     if (min_ <= data_min && data_max <= max_) {                                     \
       return 1.0;                                                                   \
     }                                                                               \
     TYPE overlap_min = std::max(min_, data_min);                                    \
     TYPE overlap_max = std::min(max_, data_max);                                    \
     return (overlap_max - overlap_min + 1) / (data_max - data_min + 1);             \
   }                                                                                 \
   float NAME##MinMaxFilter::ComputeOverlapRatio(const ColumnType& type,             \
       const TColumnValue& data_min, const TColumnValue& data_max) {                 \
     /* double_val is read here as a double and converted to TYPE, because */        \
     /* the void* overload dereferences its arguments as TYPE*. */                   \
     TYPE typed_min = static_cast<TYPE>(data_min.double_val);                        \
     TYPE typed_max = static_cast<TYPE>(data_max.double_val);                        \
     return ComputeOverlapRatio(                                                     \
         type, static_cast<void*>(&typed_min), static_cast<void*>(&typed_max));      \
   }

 // Bool, Float and Double filters do not support casting their bounds to an integer
 // range: their GetCastIntMinMax() only DCHECKs.
 NUMERIC_MIN_MAX_FILTER_NO_CAST(Bool, bool);
 NUMERIC_MIN_MAX_FILTER_NO_CAST(Float, float);
 NUMERIC_MIN_MAX_FILTER_NO_CAST(Double, double);

 // Generate EvalOverlap() and both ComputeOverlapRatio() flavors for the floating point
 // filters. The second argument is the C++ type the void* data pointers are read as.
 APPROXIMATE_NUMERIC_MIN_MAX_FILTER_EVAL_OVERLAP(Float, float);
 APPROXIMATE_NUMERIC_MIN_MAX_FILTER_EVAL_OVERLAP(Double, double);

 // STRING
 // LLVM class name string for StringMinMaxFilter.
 const char* StringMinMaxFilter::LLVM_CLASS_NAME = "class.impala::StringMinMaxFilter";
 // Longest bound that MaterializeMinValue() / MaterializeMaxValue() keep; longer min and
 // max values are truncated to this length.
 const int StringMinMaxFilter::MAX_BOUND_LENGTH = 1024;

 // Backing storage for the two bound constants below: a single NUL byte, and
 // MAX_BOUND_LENGTH bytes of 0xff, respectively.
 const std::string StringMinMaxFilter::min_string("\0", 1);
 const std::string StringMinMaxFilter::max_string(MAX_BOUND_LENGTH, (uint8_t)0xff);

 // StringValue forms of min_string / max_string. They are constructed from the strings
 // above, so those definitions must stay ahead of these two.
 const StringValue StringMinMaxFilter::MIN_BOUND_STRING(min_string);
 const StringValue StringMinMaxFilter::MAX_BOUND_STRING(max_string);

 // Builds a string filter from its protobuf form. The always-false / always-true flags
 // are taken over as-is. Only when both are unset does the protobuf have to carry string
 // min and max values; these are then assigned to min_ / max_ and handed to
 // CopyToBuffer() together with min_buffer_ / max_buffer_, which allocate from
 // 'mem_tracker' via mem_pool_.
 StringMinMaxFilter::StringMinMaxFilter(
     const MinMaxFilterPB& protobuf, MemTracker* mem_tracker)
   : mem_pool_(mem_tracker), min_buffer_(&mem_pool_), max_buffer_(&mem_pool_) {
   always_false_ = protobuf.always_false();
   always_true_ = protobuf.always_true();
   // Without bounds there is nothing to deserialize.
   if (always_true_ || always_false_) return;

   DCHECK(protobuf.has_min());
   DCHECK(protobuf.has_max());
   DCHECK(protobuf.min().has_string_val());
   DCHECK(protobuf.max().has_string_val());
   // Both values are assigned before either is copied: a failing CopyToBuffer() resets
   // min_ and max_ through SetAlwaysTrue(), so the order of these statements matters.
   min_ = StringValue(protobuf.min().string_val());
   max_ = StringValue(protobuf.max().string_val());
   CopyToBuffer(&min_buffer_, &min_, min_.Len());
   CopyToBuffer(&max_buffer_, &max_, max_.Len());
 }

 // Returns the primitive type this filter applies to, which is always TYPE_STRING.
 PrimitiveType StringMinMaxFilter::type() const {
   return PrimitiveType::TYPE_STRING;
 }

 // Hands min_ to CopyToBuffer() with min_buffer_ as the destination, keeping at most
 // MAX_BOUND_LENGTH bytes of it.
 void StringMinMaxFilter::MaterializeMinValue() {
   // A truncated string compares <= the original, so a clipped min_ is still a valid
   // lower bound.
   int64_t bytes_to_keep = min_.Len();
   if (bytes_to_keep > MAX_BOUND_LENGTH) bytes_to_keep = MAX_BOUND_LENGTH;
   CopyToBuffer(&min_buffer_, &min_, bytes_to_keep);
 }

 // Hands max_ to CopyToBuffer() with max_buffer_ as the destination. A max_ longer than
 // MAX_BOUND_LENGTH is truncated and then incremented in place so that it remains an
 // upper bound; if that is impossible the filter is switched to always-true.
 void StringMinMaxFilter::MaterializeMaxValue() {
   if (max_.Len() > MAX_BOUND_LENGTH) {
     CopyToBuffer(&max_buffer_, &max_, MAX_BOUND_LENGTH);
     // CopyToBuffer() calls SetAlwaysTrue() when appending to the buffer fails; there
     // is no bound left to adjust in that case.
     if (always_true_) return;
     // A truncated string compares <= the original, so to still have a valid max bound
     // we add 1 to the last char that is not already the max char. Trailing max chars are
     // incremented as well (the loop below), which carries the increment to the left. If
     // the entire string is already the max char, then disable this filter by making it
     // always_true.
     int i = MAX_BOUND_LENGTH - 1;
     // NOTE(review): comparing against -1 matches a 0xff byte only if buffer() yields
     // signed chars - confirm against StringBuffer.
     while (i >= 0 && static_cast<int32_t>(max_buffer_.buffer()[i]) == -1) {
       max_buffer_.buffer()[i] = max_buffer_.buffer()[i] + 1;
       --i;
     }
     if (i == -1) {
       SetAlwaysTrue();
       return;
     }
     max_buffer_.buffer()[i] = max_buffer_.buffer()[i] + 1;
   } else {
     // Short enough to be kept in full.
     CopyToBuffer(&max_buffer_, &max_, max_.Len());
   }
 }

 // Materializes min_ and/or max_ for every bound whose buffer is still empty. Does
 // nothing for always-true and always-false filters, which carry no bounds.
 void StringMinMaxFilter::MaterializeValues() {
   if (!always_true_ && !always_false_) {
     if (min_buffer_.IsEmpty()) {
       MaterializeMinValue();
     }
     if (max_buffer_.IsEmpty()) {
       MaterializeMaxValue();
     }
   }
 }

 // Serializes the filter into 'protobuf'. Both flags are always written; the min and max
 // strings are written only when the filter is neither always-true nor always-false.
 void StringMinMaxFilter::ToProtobuf(MinMaxFilterPB* protobuf) const {
   protobuf->set_always_false(always_false_);
   protobuf->set_always_true(always_true_);
   if (always_true_ || always_false_) return;

   protobuf->mutable_min()->set_string_val(min_.Ptr(), min_.Len());
   protobuf->mutable_max()->set_string_val(max_.Ptr(), max_.Len());
 }

 // Returns a human-readable dump of the bounds and of both flags.
 string StringMinMaxFilter::DebugString() const {
   const char* const false_flag = always_false_ ? "true" : "false";
   const char* const true_flag = always_true_ ? "true" : "false";

   stringstream text;
   text << "StringMinMaxFilter(min=" << min_ << ", max=" << max_;
   text << ", always_false=" << false_flag;
   text << ", always_true=" << true_flag << ")";
   return text.str();
 }

 void StringMinMaxFilter::Or(const MinMaxFilterPB& in, MinMaxFilterPB* out) {
   if (out->always_false()) {
     out->mutable_min()->set_string_val(in.min().string_val());
     out->mutable_max()->set_string_val(in.max().string_val());
     out->set_always_false(false);
   } else {
     if (in.always_true() || out->always_true()) {
       out->set_always_true(true);
     } else {
       StringValue in_min_val = StringValue(in.min().string_val());
       StringValue out_min_val = StringValue(out->min().string_val());
       if (in_min_val < out_min_val)
         out->mutable_min()->set_string_val(in.min().string_val());
       StringValue in_max_val = StringValue(in.max().string_val());
       StringValue out_max_val = StringValue(out->max().string_val());
       if (in_max_val > out_max_val)
         out->mutable_max()->set_string_val(in.max().string_val());
     }
   }
 }

 // Copies the min and max string values from 'in' to 'out'. The always-true and
 // always-false flags of 'out' are left untouched.
 void StringMinMaxFilter::Copy(const MinMaxFilterPB& in, MinMaxFilterPB* out) {
   auto* dest_min = out->mutable_min();
   dest_min->set_string_val(in.min().string_val());
   auto* dest_max = out->mutable_max();
   dest_max->set_string_val(in.max().string_val());
 }

 // Copies the first 'len' bytes of 'value' into 'buffer' and re-points 'value' at that
 // copy. Nothing is copied when 'value' already points at the buffer's memory, or when
 // value->IsSmall() holds (NOTE(review): presumably the bytes then live inside the
 // StringValue itself - confirm). If appending to the buffer fails, the filter is
 // disabled via SetAlwaysTrue().
 void StringMinMaxFilter::CopyToBuffer(
     StringBuffer* buffer, StringValue* value, int64_t len) {
   const bool already_in_buffer = value->Ptr() == buffer->buffer();
   if (already_in_buffer) return;

   if (value->IsSmall()) {
     DCHECK_LE(value->Len(), len);
     return;
   }

   buffer->Clear();
   const auto append_status = buffer->Append(value->Ptr(), len);
   if (append_status.ok()) {
     value->Assign(buffer->buffer(), len);
   } else {
     // If Append() fails, for example because we're out of memory, disable the filter.
     SetAlwaysTrue();
   }
 }

 // Turns the filter into an always-true filter: sets always_true_, resets always_false_,
 // and clears both bounds together with their buffers.
 void StringMinMaxFilter::SetAlwaysTrue() {
   // Flags first.
   always_false_ = false;
   always_true_ = true;
   // Then drop the lower bound and the upper bound.
   min_buffer_.Clear();
   min_.Clear();
   max_buffer_.Clear();
   max_.Clear();
 }

 bool StringMinMaxFilter::EvalOverlap(
     const ColumnType& type, void* data_min, void* data_max) const {
   return !((*(StringValue*)data_max) < min_ || max_ < (*(StringValue*)data_min));
 }

 float StringMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, void* data_min_ptr, void* data_max_ptr) {
   StringValue* data_min = (StringValue*)data_min_ptr;
   StringValue* data_max = (StringValue*)data_max_ptr;
   /* If the filter completely covers the data range, return 1.0*/
   if (min_ <= *data_min && *data_max <= max_) {
     return 1.0;
   }
   uint64_t data_min64 = data_min->ToUInt64();
   uint64_t data_max64 = data_max->ToUInt64();
   uint64_t filter_min64 = min_.ToUInt64();
   uint64_t filter_max64 = max_.ToUInt64();
   uint64_t overlap_min = std::max(filter_min64, data_min64);
   uint64_t overlap_max = std::min(filter_max64, data_max64);
   return (float)((double)(overlap_max - overlap_min + 1)) / (data_max64 - data_min64 + 1);
 }

 // TIMESTAMP and DATE
 //
 // Generates the member definitions that TimestampMinMaxFilter and DateMinMaxFilter
 // share:
 //   - LLVM_CLASS_NAME: the string "class.impala::<NAME>MinMaxFilter".
 //   - Constructor from MinMaxFilterPB: copies the always_false/always_true flags and,
 //     when neither flag is set, decodes min/max with TYPE::FromColumnValuePB().
 //   - type(): returns PrimitiveType::TYPE_<PRIMITIVE_TYPE>.
 //   - ToProtobuf(): writes min/max (only when neither flag is set) and both flags.
 //   - DebugString(): textual dump of min_, max_, always_false_ and always_true_.
 //   - Or(in, out): if 'out' is always-false it takes over the min/max of 'in' and
 //     clears always_false; else if either side is always-true 'out' becomes
 //     always-true; otherwise 'out' keeps the smaller min and the larger max.
 //     MinMaxFilter::Or(in, out, columnType) returns early for an always-false or
 //     always-true 'in' and for an always-true 'out' before dispatching here.
 //   - Copy(in, out): copies the min and max values from 'in' to 'out'.
 //   - EvalOverlap(): true iff [*data_min, *data_max] intersects [min_, max_]; both
 //     pointers are read as TYPE*.
 //
 // Macro parameters:
 //   NAME           - class-name prefix, e.g. Timestamp.
 //   TYPE           - in-memory value type, e.g. TimestampValue.
 //   PROTOBUF_TYPE  - ColumnValuePB field prefix used as <x>_val, e.g. timestamp.
 //   PRIMITIVE_TYPE - PrimitiveType suffix, e.g. TIMESTAMP.
 #define DATE_TIME_MIN_MAX_FILTER_FUNCS(NAME, TYPE, PROTOBUF_TYPE, PRIMITIVE_TYPE)      \
   const char* NAME##MinMaxFilter::LLVM_CLASS_NAME =                                    \
       "class.impala::" #NAME "MinMaxFilter";                                           \
   NAME##MinMaxFilter::NAME##MinMaxFilter(const MinMaxFilterPB& protobuf) {             \
     always_false_ = protobuf.always_false();                                           \
     always_true_ = protobuf.always_true();                                             \
     if (!always_false_ && !always_true_) {                                             \
       DCHECK(protobuf.min().has_##PROTOBUF_TYPE##_val());                              \
       DCHECK(protobuf.max().has_##PROTOBUF_TYPE##_val());                              \
       min_ = TYPE::FromColumnValuePB(protobuf.min());                                  \
       max_ = TYPE::FromColumnValuePB(protobuf.max());                                  \
     }                                                                                  \
   }                                                                                    \
   PrimitiveType NAME##MinMaxFilter::type() const {                                     \
     return PrimitiveType::TYPE_##PRIMITIVE_TYPE;                                       \
   }                                                                                    \
   void NAME##MinMaxFilter::ToProtobuf(MinMaxFilterPB* protobuf) const {                \
     if (!always_false_ && !always_true_) {                                             \
       min_.ToColumnValuePB(protobuf->mutable_min());                                   \
       max_.ToColumnValuePB(protobuf->mutable_max());                                   \
     }                                                                                  \
     protobuf->set_always_false(always_false_);                                         \
     protobuf->set_always_true(always_true_);                                           \
   }                                                                                    \
   string NAME##MinMaxFilter::DebugString() const {                                     \
     stringstream out;                                                                  \
     /* Each flag is reported from its own member. */                                   \
     out << #NAME << "MinMaxFilter(min=" << min_ << ", max=" << max_                    \
         << ", always_false=" << (always_false_ ? "true" : "false")                     \
         << ", always_true=" << (always_true_ ? "true" : "false") << ")";               \
     return out.str();                                                                  \
   }                                                                                    \
   void NAME##MinMaxFilter::Or(const MinMaxFilterPB& in, MinMaxFilterPB* out) {         \
     if (out->always_false()) {                                                         \
       out->mutable_min()->set_##PROTOBUF_TYPE##_val(in.min().PROTOBUF_TYPE##_val());   \
       out->mutable_max()->set_##PROTOBUF_TYPE##_val(in.max().PROTOBUF_TYPE##_val());   \
       out->set_always_false(false);                                                    \
     } else if (in.always_true() || out->always_true()) {                               \
       out->set_always_true(true);                                                      \
     } else {                                                                           \
       TYPE in_min_val = TYPE::FromColumnValuePB(in.min());                             \
       TYPE out_min_val = TYPE::FromColumnValuePB(out->min());                          \
       if (in_min_val < out_min_val) {                                                  \
         out->mutable_min()->set_##PROTOBUF_TYPE##_val(in.min().PROTOBUF_TYPE##_val()); \
       }                                                                                \
       TYPE in_max_val = TYPE::FromColumnValuePB(in.max());                             \
       TYPE out_max_val = TYPE::FromColumnValuePB(out->max());                          \
       if (in_max_val > out_max_val) {                                                  \
         out->mutable_max()->set_##PROTOBUF_TYPE##_val(in.max().PROTOBUF_TYPE##_val()); \
       }                                                                                \
     }                                                                                  \
   }                                                                                    \
   void NAME##MinMaxFilter::Copy(const MinMaxFilterPB& in, MinMaxFilterPB* out) {       \
     out->mutable_min()->set_##PROTOBUF_TYPE##_val(in.min().PROTOBUF_TYPE##_val());     \
     out->mutable_max()->set_##PROTOBUF_TYPE##_val(in.max().PROTOBUF_TYPE##_val());     \
   }                                                                                    \
   bool NAME##MinMaxFilter::EvalOverlap(                                                \
       const ColumnType& type, void* data_min, void* data_max) const {                  \
     return !((*(TYPE*)data_max) < min_ || max_ < (*(TYPE*)data_min));                  \
   }

 // Emit the shared member definitions for TimestampMinMaxFilter (TimestampValue,
 // 'timestamp_val' protobuf field) and DateMinMaxFilter (DateValue, 'date_val' field).
 DATE_TIME_MIN_MAX_FILTER_FUNCS(Timestamp, TimestampValue, timestamp, TIMESTAMP);
 DATE_TIME_MIN_MAX_FILTER_FUNCS(Date, DateValue, date, DATE);

 float TimestampMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, void* data_min_ptr, void* data_max_ptr) {
   TimestampValue* data_min = (TimestampValue*)data_min_ptr;
   TimestampValue* data_max = (TimestampValue*)data_max_ptr;
   /* If the filter completely covers the data range, return 1.0 */
   if (min_ <= *data_min && *data_max <= max_) {
     return 1.0;
   }
   int64_t data_min_in_ns = 0;
   int64_t data_max_in_ns = 0;
   int64_t filter_min_in_ns = 0;
   int64_t filter_max_in_ns = 0;
   if (!data_min->UtcToUnixTimeLimitedRangeNanos(&data_min_in_ns)
       || !data_max->UtcToUnixTimeLimitedRangeNanos(&data_max_in_ns)
       || !min_.UtcToUnixTimeLimitedRangeNanos(&filter_min_in_ns)
       || !max_.UtcToUnixTimeLimitedRangeNanos(&filter_max_in_ns))
     return 1.0;

   int64_t overlap_min = std::max(filter_min_in_ns, data_min_in_ns);
   int64_t overlap_max = std::min(filter_max_in_ns, data_max_in_ns);
   return (float)(overlap_max - overlap_min + 1) / (data_max_in_ns - data_min_in_ns + 1);
 }

 // TColumnValue overload for timestamps. None of the arguments are inspected; the
 // reported overlap ratio is always 0.
 float TimestampMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, const TColumnValue& data_min, const TColumnValue& data_max) {
   return 0.0f;
 }

 float DateMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, void* data_min_ptr, void* data_max_ptr) {
   DateValue* data_min = (DateValue*)data_min_ptr;
   DateValue* data_max = (DateValue*)data_max_ptr;
   /* If the filter completely covers the data range, return 1.0 */
   if (min_ <= *data_min && *data_max <= max_) {
     return 1.0;
   }
   int32_t data_days_min = data_min->Value();
   int32_t data_days_max = data_max->Value();
   int32_t filter_days_min = min_.Value();
   int32_t filter_days_max = max_.Value();
   int32_t overlap_min = std::max(filter_days_min, data_days_min);
   int32_t overlap_max = std::min(filter_days_max, data_days_max);
   return (float)(overlap_max - overlap_min + 1) / (data_days_max - data_days_min + 1);
 }

 float DateMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, const TColumnValue& data_min, const TColumnValue& data_max) {
   return ComputeOverlapRatio(
       type, (void*)&data_min.date_val, (void*)&data_max.date_val);
 }

 // DECIMAL
 // Class name of DecimalMinMaxFilter in the "class.<namespace>::<class>" form.
 const char* DecimalMinMaxFilter::LLVM_CLASS_NAME = "class.impala::DecimalMinMaxFilter";
 // Decodes protobuf.min()/protobuf.max() into the min<SIZE>_/max<SIZE>_ members using
 // Decimal<SIZE>Value::FromColumnValuePB(). Expands to a single statement and expects a
 // variable named 'protobuf' in the scope where it is used. SIZE is 4, 8 or 16.
 #define DECIMAL_SET_MINMAX(SIZE)                                            \
   do {                                                                      \
     DCHECK(protobuf.min().has_decimal_val());                               \
     DCHECK(protobuf.max().has_decimal_val());                               \
     min##SIZE##_ = Decimal##SIZE##Value::FromColumnValuePB(protobuf.min()); \
     max##SIZE##_ = Decimal##SIZE##Value::FromColumnValuePB(protobuf.max()); \
   } while (false)

 // Builds a DecimalMinMaxFilter from its protobuf (MinMaxFilterPB) form. This can get
 // called in the coordinator, after the filter is sent by an executor.
 // 'precision' determines the decimal byte size and thereby which min/max member pair
 // is filled in; min/max are only decoded when the filter is neither always-false nor
 // always-true.
 DecimalMinMaxFilter::DecimalMinMaxFilter(const MinMaxFilterPB& protobuf, int precision)
   : size_(ColumnType::GetDecimalByteSize(precision)),
     always_false_(protobuf.always_false()) {
   always_true_ = protobuf.always_true();
   if (always_false_ || always_true_) return;

   if (size_ == DECIMAL_SIZE_4BYTE) {
     DECIMAL_SET_MINMAX(4);
   } else if (size_ == DECIMAL_SIZE_8BYTE) {
     DECIMAL_SET_MINMAX(8);
   } else if (size_ == DECIMAL_SIZE_16BYTE) {
     DECIMAL_SET_MINMAX(16);
   } else {
     DCHECK(false) << "DecimalMinMaxFilter: Unknown decimal byte size: " << size_;
   }
 }

 // Reports the primitive type handled by this filter: always TYPE_DECIMAL.
 PrimitiveType DecimalMinMaxFilter::type() const { return PrimitiveType::TYPE_DECIMAL; }

 // Writes the min<SIZE>_/max<SIZE>_ members into protobuf->mutable_min()/mutable_max()
 // via ToColumnValuePB(). Expands to a single statement and expects a pointer named
 // 'protobuf' in the scope where it is used. SIZE is 4, 8 or 16.
 #define DECIMAL_TO_PROTOBUF(SIZE)                          \
   do {                                                     \
     min##SIZE##_.ToColumnValuePB(protobuf->mutable_min()); \
     max##SIZE##_.ToColumnValuePB(protobuf->mutable_max()); \
   } while (false)

 // Serializes this filter into 'protobuf'. Will be called by the executor to produce
 // the filter that is sent to the coordinator.
 // Min and max are only written when the filter is neither always-false nor
 // always-true; the two flags are always written.
 void DecimalMinMaxFilter::ToProtobuf(MinMaxFilterPB* protobuf) const {
   const bool has_range = !always_false_ && !always_true_;
   if (has_range) {
     if (size_ == DECIMAL_SIZE_4BYTE) {
       DECIMAL_TO_PROTOBUF(4);
     } else if (size_ == DECIMAL_SIZE_8BYTE) {
       DECIMAL_TO_PROTOBUF(8);
     } else if (size_ == DECIMAL_SIZE_16BYTE) {
       DECIMAL_TO_PROTOBUF(16);
     } else {
       DCHECK(false) << "DecimalMinMaxFilter: Unknown decimal byte size: " << size_;
     }
   }
   protobuf->set_always_false(always_false_);
   protobuf->set_always_true(always_true_);
 }

 // Forwards 'val' to Insert4/Insert8/Insert16 according to the decimal byte size of
 // this filter. A null 'val' is ignored.
 void DecimalMinMaxFilter::Insert(const void* val) {
   if (val == nullptr) return;
   if (size_ == 4) {
     Insert4(val);
   } else if (size_ == 8) {
     Insert8(val);
   } else if (size_ == 16) {
     Insert16(val);
   } else {
     DCHECK(false) << "Unknown decimal size: " << size_;
   }
 }

 // Forwards 'val' to Insert4ForLE/Insert8ForLE/Insert16ForLE according to the decimal
 // byte size of this filter. A null 'val' is ignored.
 void DecimalMinMaxFilter::InsertForLE(const void* val) {
   if (val == nullptr) return;
   if (size_ == 4) {
     Insert4ForLE(val);
   } else if (size_ == 8) {
     Insert8ForLE(val);
   } else if (size_ == 16) {
     Insert16ForLE(val);
   } else {
     DCHECK(false) << "Unknown decimal size: " << size_;
   }
 }

 // Forwards 'val' to Insert4ForGE/Insert8ForGE/Insert16ForGE according to the decimal
 // byte size of this filter. A null 'val' is ignored.
 void DecimalMinMaxFilter::InsertForGE(const void* val) {
   if (val == nullptr) return;
   if (size_ == 4) {
     Insert4ForGE(val);
   } else if (size_ == 8) {
     Insert8ForGE(val);
   } else if (size_ == 16) {
     Insert16ForGE(val);
   } else {
     DCHECK(false) << "Unknown decimal size: " << size_;
   }
 }

 // Forwards 'val' to Insert4ForLT/Insert8ForLT/Insert16ForLT according to the decimal
 // byte size of this filter. A null 'val' is ignored.
 void DecimalMinMaxFilter::InsertForLT(const void* val) {
   if (val == nullptr) return;
   if (size_ == 4) {
     Insert4ForLT(val);
   } else if (size_ == 8) {
     Insert8ForLT(val);
   } else if (size_ == 16) {
     Insert16ForLT(val);
   } else {
     DCHECK(false) << "Unknown decimal size: " << size_;
   }
 }

 // Forwards 'val' to Insert4ForGT/Insert8ForGT/Insert16ForGT according to the decimal
 // byte size of this filter. A null 'val' is ignored.
 void DecimalMinMaxFilter::InsertForGT(const void* val) {
   if (val == nullptr) return;
   if (size_ == 4) {
     Insert4ForGT(val);
   } else if (size_ == 8) {
     Insert8ForGT(val);
   } else if (size_ == 16) {
     Insert16ForGT(val);
   } else {
     DCHECK(false) << "Unknown decimal size: " << size_;
   }
 }

 // Streams a textual dump of the min<SIZE>_/max<SIZE>_ members and of both the
 // always_false_ and always_true_ flags into a stream named 'out', which must exist in
 // the scope where the macro is used. SIZE is 4, 8 or 16.
 #define DECIMAL_DEBUG_STRING(SIZE)                                                 \
   do {                                                                             \
     out << "DecimalMinMaxFilter(min=" << min##SIZE##_ << ", max=" << max##SIZE##_  \
         << ", always_false=" << (always_false_ ? "true" : "false")                 \
         << ", always_true=" << (always_true_ ? "true" : "false") << ")";           \
   } while (false)

 // Returns a textual description of this filter, produced by DECIMAL_DEBUG_STRING for
 // the min/max pair that matches the filter's decimal byte size. The result is empty
 // if the size is not one of the known decimal sizes.
 string DecimalMinMaxFilter::DebugString() const {
   stringstream out;
   if (size_ == DECIMAL_SIZE_4BYTE) {
     DECIMAL_DEBUG_STRING(4);
   } else if (size_ == DECIMAL_SIZE_8BYTE) {
     DECIMAL_DEBUG_STRING(8);
   } else if (size_ == DECIMAL_SIZE_16BYTE) {
     DECIMAL_DEBUG_STRING(16);
   } else {
     DCHECK(false) << "DecimalMinMaxFilter: Unknown decimal byte size: " << size_;
   }
   return out.str();
 }

 // Widens the range stored in 'out' so that it also covers the range stored in 'in':
 // out.min is replaced when in.min is smaller, out.max is replaced when in.max is
 // larger. Values are compared as Decimal<SIZE>Value. Expands to a single statement
 // and expects 'in' (MinMaxFilterPB reference) and 'out' (MinMaxFilterPB pointer) in
 // the scope where it is used. SIZE is 4, 8 or 16.
 #define DECIMAL_OR(SIZE)                                           \
   do {                                                             \
     if (Decimal##SIZE##Value::FromColumnValuePB(in.min())          \
         < Decimal##SIZE##Value::FromColumnValuePB(out->min()))     \
       out->mutable_min()->set_decimal_val(in.min().decimal_val()); \
     if (Decimal##SIZE##Value::FromColumnValuePB(in.max())          \
         > Decimal##SIZE##Value::FromColumnValuePB(out->max()))     \
       out->mutable_max()->set_decimal_val(in.max().decimal_val()); \
   } while (false)

 // Merges the decimal filter 'in' into 'out' so that 'out' accepts everything either
 // of them accepted:
 //   - an always-false 'in' leaves 'out' untouched;
 //   - an always-false 'out' takes over the min/max of 'in' and stops being
 //     always-false;
 //   - if either side is always-true, 'out' becomes always-true;
 //   - otherwise min/max of 'out' are widened, comparing values with the decimal type
 //     that matches the byte size derived from 'precision'.
 void DecimalMinMaxFilter::Or(
     const MinMaxFilterPB& in, MinMaxFilterPB* out, int precision) {
   if (in.always_false()) return;

   if (out->always_false()) {
     out->mutable_min()->set_decimal_val(in.min().decimal_val());
     out->mutable_max()->set_decimal_val(in.max().decimal_val());
     out->set_always_false(false);
     return;
   }

   if (in.always_true() || out->always_true()) {
     out->set_always_true(true);
     return;
   }

   int size = ColumnType::GetDecimalByteSize(precision);
   if (size == DECIMAL_SIZE_4BYTE) {
     DECIMAL_OR(4);
   } else if (size == DECIMAL_SIZE_8BYTE) {
     DECIMAL_OR(8);
   } else if (size == DECIMAL_SIZE_16BYTE) {
     DECIMAL_OR(16);
   } else {
     DCHECK(false) << "Unknown decimal size: " << size;
   }
 }

 // Copies the decimal min and max values of 'in' into 'out'. The always_false and
 // always_true flags are not touched here.
 void DecimalMinMaxFilter::Copy(const MinMaxFilterPB& in, MinMaxFilterPB* out) {
   const auto& src_min = in.min();
   out->mutable_min()->set_decimal_val(src_min.decimal_val());
   const auto& src_max = in.max();
   out->mutable_max()->set_decimal_val(src_max.decimal_val());
 }

 bool DecimalMinMaxFilter::EvalOverlap(
     const ColumnType& type, void* data_min, void* data_max) const {
   bool overlap = true;
   switch (type.GetByteSize()) {
     case 4:
       overlap =
           !((*(Decimal4Value*)data_max) < min4_ || max4_ < (*(Decimal4Value*)data_min));
       break;
     case 8:
       overlap =
           !((*(Decimal8Value*)data_max) < min8_ || max8_ < (*(Decimal8Value*)data_min));
       break;
     case 16:
       overlap = !(
           (*(Decimal16Value*)data_max) < min16_ || max16_ < (*(Decimal16Value*)data_min));
       break;
     default:
       DCHECK(false) << "DecimalMinMaxFilter: Unknown decimal byte size: "
                     << type.GetByteSize();
   }
   return overlap;
 }

 float DecimalMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, void* data_min_ptr, void* data_max_ptr) {
   double data_min = 0;
   double data_max = 0;
   double filter_min = 0;
   double filter_max = 0;
   switch (type.GetByteSize()) {
     case 4:
       data_min = ((Decimal4Value*)data_min_ptr)->ToDouble(type.scale);
       data_max = ((Decimal4Value*)data_max_ptr)->ToDouble(type.scale);
       filter_min = min4_.ToDouble(type.scale);
       filter_max = max4_.ToDouble(type.scale);
       break;
     case 8:
       data_min = ((Decimal8Value*)data_min_ptr)->ToDouble(type.scale);
       data_max = ((Decimal8Value*)data_max_ptr)->ToDouble(type.scale);
       filter_min = min8_.ToDouble(type.scale);
       filter_max = max8_.ToDouble(type.scale);
       break;
     case 16:
       data_min = ((Decimal16Value*)data_min_ptr)->ToDouble(type.scale);
       data_max = ((Decimal16Value*)data_max_ptr)->ToDouble(type.scale);
       filter_min = min16_.ToDouble(type.scale);
       filter_max = max16_.ToDouble(type.scale);
       break;
     default:
       DCHECK(false) << "DecimalMinMaxFilter: Unknown decimal byte size: "
                     << type.GetByteSize();
   }
   /* If the filter completely covers the data range, return 1.0*/
   if (filter_min <= data_min && data_max <= filter_max) {
     return 1.0;
   }
   double overlap_min = std::max(filter_min, data_min);
   double overlap_max = std::min(filter_max, data_max);
   return (float)((overlap_max - overlap_min + 1) / (data_max - data_min + 1));
 }

 float DecimalMinMaxFilter::ComputeOverlapRatio(
     const ColumnType& type, const TColumnValue& data_min, const TColumnValue& data_max) {
   ColumnValuePB min_pb, max_pb;
   min_pb.set_decimal_val(data_min.decimal_val); // decimal_val is std::string
   max_pb.set_decimal_val(data_max.decimal_val);
   switch (type.GetByteSize()) {
     case 4: {
       Decimal4Value min = Decimal4Value::FromColumnValuePB(min_pb);
       Decimal4Value max = Decimal4Value::FromColumnValuePB(max_pb);
       return ComputeOverlapRatio(type, (void*)&min, (void*)&max);
     }
     case 8: {
       Decimal8Value min = Decimal8Value::FromColumnValuePB(min_pb);
       Decimal8Value max = Decimal8Value::FromColumnValuePB(max_pb);
       return ComputeOverlapRatio(type, (void*)&min, (void*)&max);
     }
     case 16: {
       Decimal16Value min = Decimal16Value::FromColumnValuePB(min_pb);
       Decimal16Value max = Decimal16Value::FromColumnValuePB(max_pb);
       return ComputeOverlapRatio(type, (void*)&min, (void*)&max);
     }
     default:
       DCHECK(false) << "DecimalMinMaxFilter: Unknown decimal byte size: "
                     << type.GetByteSize();
   }
   // Impossible to reach
   return 0;
 }

 // Base-class implementation: casting is not supported here. Trips a DCHECK that names
 // the filter's type, leaves 'out_min' and 'out_max' untouched and returns true.
 bool MinMaxFilter::GetCastIntMinMax(
     const ColumnType& type, int64_t* out_min, int64_t* out_max) const {
   // 'type' is shadowed by the parameter, hence the explicit this->type().
   DCHECK(false) << "Casting min-max filters of type "
                 << this->type()
                 << " not supported.";
   return true;
 }

 // Creates a new filter for a column of type 'type' and registers it with 'pool' via
 // ObjectPool::Add(). 'mem_tracker' is only passed on to string filters and
 // type.precision only to decimal filters. Returns nullptr for unsupported types.
 MinMaxFilter* MinMaxFilter::Create(
     ColumnType type, ObjectPool* pool, MemTracker* mem_tracker) {
   MinMaxFilter* filter = nullptr;
   switch (type.type) {
     case PrimitiveType::TYPE_BOOLEAN:
       filter = pool->Add(new BoolMinMaxFilter());
       break;
     case PrimitiveType::TYPE_TINYINT:
       filter = pool->Add(new TinyIntMinMaxFilter());
       break;
     case PrimitiveType::TYPE_SMALLINT:
       filter = pool->Add(new SmallIntMinMaxFilter());
       break;
     case PrimitiveType::TYPE_INT:
       filter = pool->Add(new IntMinMaxFilter());
       break;
     case PrimitiveType::TYPE_BIGINT:
       filter = pool->Add(new BigIntMinMaxFilter());
       break;
     case PrimitiveType::TYPE_FLOAT:
       filter = pool->Add(new FloatMinMaxFilter());
       break;
     case PrimitiveType::TYPE_DOUBLE:
       filter = pool->Add(new DoubleMinMaxFilter());
       break;
     case PrimitiveType::TYPE_STRING:
       filter = pool->Add(new StringMinMaxFilter(mem_tracker));
       break;
     case PrimitiveType::TYPE_TIMESTAMP:
       filter = pool->Add(new TimestampMinMaxFilter());
       break;
     case PrimitiveType::TYPE_DATE:
       filter = pool->Add(new DateMinMaxFilter());
       break;
     case PrimitiveType::TYPE_DECIMAL:
       filter = pool->Add(new DecimalMinMaxFilter(type.precision));
       break;
     default:
       DCHECK(false) << "Unsupported MinMaxFilter type: " << type;
   }
   return filter;
 }

 // Creates a filter for a column of type 'type' from its protobuf form and registers
 // it with 'pool' via ObjectPool::Add(). 'mem_tracker' is only passed on to string
 // filters and type.precision only to decimal filters. Returns nullptr for
 // unsupported types.
 MinMaxFilter* MinMaxFilter::Create(const MinMaxFilterPB& protobuf, ColumnType type,
     ObjectPool* pool, MemTracker* mem_tracker) {
   MinMaxFilter* filter = nullptr;
   switch (type.type) {
     case PrimitiveType::TYPE_BOOLEAN:
       filter = pool->Add(new BoolMinMaxFilter(protobuf));
       break;
     case PrimitiveType::TYPE_TINYINT:
       filter = pool->Add(new TinyIntMinMaxFilter(protobuf));
       break;
     case PrimitiveType::TYPE_SMALLINT:
       filter = pool->Add(new SmallIntMinMaxFilter(protobuf));
       break;
     case PrimitiveType::TYPE_INT:
       filter = pool->Add(new IntMinMaxFilter(protobuf));
       break;
     case PrimitiveType::TYPE_BIGINT:
       filter = pool->Add(new BigIntMinMaxFilter(protobuf));
       break;
     case PrimitiveType::TYPE_FLOAT:
       filter = pool->Add(new FloatMinMaxFilter(protobuf));
       break;
     case PrimitiveType::TYPE_DOUBLE:
       filter = pool->Add(new DoubleMinMaxFilter(protobuf));
       break;
     case PrimitiveType::TYPE_STRING:
       filter = pool->Add(new StringMinMaxFilter(protobuf, mem_tracker));
       break;
     case PrimitiveType::TYPE_TIMESTAMP:
       filter = pool->Add(new TimestampMinMaxFilter(protobuf));
       break;
     case PrimitiveType::TYPE_DATE:
       filter = pool->Add(new DateMinMaxFilter(protobuf));
       break;
     case PrimitiveType::TYPE_DECIMAL:
       filter = pool->Add(new DecimalMinMaxFilter(protobuf, type.precision));
       break;
     default:
       DCHECK(false) << "Unsupported MinMaxFilter type: " << type;
   }
   return filter;
 }

 // Merges 'other' into this filter so that this filter also accepts everything
 // 'other' accepts.
 void MinMaxFilter::Or(const MinMaxFilter& other) {
   if (other.AlwaysFalse()) {
     // Updating with always false is a no-op.
   } else if (other.AlwaysTrue()) {
     SetAlwaysTrue();
   } else {
     // 'other' should hold valid min and max values here; inserting both of them
     // widens this filter to cover the range of 'other'.
     Insert(other.GetMin());
     Insert(other.GetMax());
   }
 }

 // Merges the protobuf filter 'in' into 'out'. Nothing happens when 'in' is
 // always-false or 'out' is already always-true; an always-true 'in' makes 'out'
 // always-true. Otherwise the work is delegated to the type-specific static Or(),
 // selected by which value field is set on in.min(). 'columnType' is only consulted
 // for the precision of decimal filters.
 void MinMaxFilter::Or(
     const MinMaxFilterPB& in, MinMaxFilterPB* out, const ColumnType& columnType) {
   if (in.always_false() || out->always_true()) return;
   if (in.always_true()) {
     out->set_always_true(true);
     return;
   }

   const auto& in_min = in.min();
   if (in_min.has_bool_val()) {
     DCHECK(out->min().has_bool_val());
     BoolMinMaxFilter::Or(in, out);
   } else if (in_min.has_byte_val()) {
     DCHECK(out->min().has_byte_val());
     TinyIntMinMaxFilter::Or(in, out);
   } else if (in_min.has_short_val()) {
     DCHECK(out->min().has_short_val());
     SmallIntMinMaxFilter::Or(in, out);
   } else if (in_min.has_int_val()) {
     DCHECK(out->min().has_int_val());
     IntMinMaxFilter::Or(in, out);
   } else if (in_min.has_long_val()) {
     DCHECK(out->min().has_long_val());
     BigIntMinMaxFilter::Or(in, out);
   } else if (in_min.has_double_val()) {
     // Float filters are merged here as well; they also arrive as double_val.
     DCHECK(out->min().has_double_val());
     DoubleMinMaxFilter::Or(in, out);
   } else if (in_min.has_string_val()) {
     DCHECK(out->min().has_string_val());
     StringMinMaxFilter::Or(in, out);
   } else if (in_min.has_timestamp_val()) {
     DCHECK(out->min().has_timestamp_val());
     TimestampMinMaxFilter::Or(in, out);
   } else if (in_min.has_date_val()) {
     DCHECK(out->min().has_date_val());
     DateMinMaxFilter::Or(in, out);
   } else if (in_min.has_decimal_val()) {
     DCHECK(out->min().has_decimal_val());
     DecimalMinMaxFilter::Or(in, out, columnType.precision);
   } else {
     DCHECK(false) << "Unsupported MinMaxFilter type.";
   }
 }

 // Copies the protobuf filter 'in' into 'out'. The always_false/always_true flags are
 // always copied; min/max are copied only when neither flag is set, by delegating to
 // the type-specific static Copy() selected by which value field is set on in.min().
 // 'out' is expected not to carry a min value of that kind yet.
 void MinMaxFilter::Copy(const MinMaxFilterPB& in, MinMaxFilterPB* out) {
   out->set_always_false(in.always_false());
   out->set_always_true(in.always_true());
   if (in.always_false() || in.always_true()) return;

   const auto& in_min = in.min();
   if (in_min.has_bool_val()) {
     DCHECK(!out->min().has_bool_val());
     BoolMinMaxFilter::Copy(in, out);
   } else if (in_min.has_byte_val()) {
     DCHECK(!out->min().has_byte_val());
     TinyIntMinMaxFilter::Copy(in, out);
   } else if (in_min.has_short_val()) {
     DCHECK(!out->min().has_short_val());
     SmallIntMinMaxFilter::Copy(in, out);
   } else if (in_min.has_int_val()) {
     DCHECK(!out->min().has_int_val());
     IntMinMaxFilter::Copy(in, out);
   } else if (in_min.has_long_val()) {
     DCHECK(!out->min().has_long_val());
     BigIntMinMaxFilter::Copy(in, out);
   } else if (in_min.has_double_val()) {
     // Float filters are copied here as well; they also arrive as double_val.
     DCHECK(!out->min().has_double_val());
     DoubleMinMaxFilter::Copy(in, out);
   } else if (in_min.has_string_val()) {
     DCHECK(!out->min().has_string_val());
     StringMinMaxFilter::Copy(in, out);
   } else if (in_min.has_timestamp_val()) {
     DCHECK(!out->min().has_timestamp_val());
     TimestampMinMaxFilter::Copy(in, out);
   } else if (in_min.has_date_val()) {
     DCHECK(!out->min().has_date_val());
     DateMinMaxFilter::Copy(in, out);
   } else if (in_min.has_decimal_val()) {
     DCHECK(!out->min().has_decimal_val());
     DecimalMinMaxFilter::Copy(in, out);
   } else {
     DCHECK(false) << "Unsupported MinMaxFilter type.";
   }
 }

 // Renders the value held by 'v' as text. The first field found set, in the order
 // checked below, is printed; the result is empty when none is set. Decimals are
 // printed as doubles using col_type's byte size and scale; 'col_type' is not used for
 // any other kind of value.
 string MinMaxFilter::DebugString(const ColumnValuePB& v, const ColumnType& col_type) {
   std::stringstream text;
   if (v.has_string_val()) {
     text << v.string_val();
   } else if (v.has_binary_val()) {
     text << v.binary_val();
   } else if (v.has_timestamp_val()) {
     text << TimestampValue::FromColumnValuePB(v);
   } else if (v.has_decimal_val()) {
     double as_double = 0.0;
     const auto byte_size = col_type.GetByteSize();
     if (byte_size == 4) {
       as_double = Decimal4Value::FromColumnValuePB(v).ToDouble(col_type.scale);
     } else if (byte_size == 8) {
       as_double = Decimal8Value::FromColumnValuePB(v).ToDouble(col_type.scale);
     } else if (byte_size == 16) {
       as_double = Decimal16Value::FromColumnValuePB(v).ToDouble(col_type.scale);
     } else {
       DCHECK(false) << "Unknown byte size for decimal.";
     }
     text << as_double;
   } else if (v.has_bool_val()) {
     text << v.bool_val();
   } else if (v.has_int_val()) {
     text << v.int_val();
   } else if (v.has_long_val()) {
     text << v.long_val();
   } else if (v.has_double_val()) {
     text << v.double_val();
   } else if (v.has_byte_val()) {
     text << v.byte_val();
   } else if (v.has_short_val()) {
     text << v.short_val();
   } else if (v.has_date_val()) {
     text << DateValue::FromColumnValuePB(v).ToString();
   }
   return text.str();
 }

 // Renders a protobuf filter as text: both flags (a flag that is not present counts as
 // false) followed by min and max, each printed as "N/A" when absent.
 string MinMaxFilter::DebugString(
     const MinMaxFilterPB& filter, const ColumnType& col_type) {
   const bool is_always_true = filter.has_always_true() && filter.always_true();
   const bool is_always_false = filter.has_always_false() && filter.always_false();

   std::stringstream text;
   text << "MinmaxFilterPB:"
        << " always_true()=" << is_always_true
        << ", always_false()=" << is_always_false;
   text << ", min=" << (filter.has_min() ? DebugString(filter.min(), col_type) : "N/A");
   text << ", max=" << (filter.has_max() ? DebugString(filter.max(), col_type) : "N/A");
   return text.str();
 }

 // Returns true iff 'filter' has its always_true field present and set to true.
 bool MinMaxFilter::AlwaysTrue(const MinMaxFilterPB& filter) {
   if (!filter.has_always_true()) return false;
   return filter.always_true();
 }

 // Returns true iff 'filter' has its always_false field present and set to true.
 bool MinMaxFilter::AlwaysFalse(const MinMaxFilterPB& filter) {
   if (!filter.has_always_false()) return false;
   return filter.always_false();
 }

 } // namespace impala