/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.spark.sql.optimizer
import java.util
import scala.collection.JavaConverters._
import scala.collection.mutable.ArrayBuffer
import org.apache.spark.sql._
import org.apache.spark.sql.catalyst.CarbonTableIdentifierImplicit._
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.aggregate._
import org.apache.spark.sql.catalyst.optimizer.Optimizer
import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.rules.Rule
import org.apache.spark.sql.execution.command.ProjectForUpdateCommand
import org.apache.spark.sql.execution.RunnableCommand
import org.apache.spark.sql.execution.datasources.LogicalRelation
import org.apache.spark.sql.types.{IntegerType, StringType}
import org.apache.carbondata.common.logging.LogServiceFactory
import org.apache.carbondata.core.constants.CarbonCommonConstants
import org.apache.carbondata.core.stats.QueryStatistic
import org.apache.carbondata.core.util.CarbonTimeStatisticsFactory
import org.apache.carbondata.spark.{CarbonAliasDecoderRelation, CarbonFilters}
/**
* Carbon optimizer that adds dictionary decoders to the optimized plan.
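*
* Illustrative usage sketch (the plan and optimizer names below are assumptions, not from
* this file):
* {{{
*   val optimizedPlan = CarbonOptimizer.execute(analyzedPlan, sparkOptimizer)
* }}}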
*/
object CarbonOptimizer {
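/**
* Wraps the given Catalyst optimizer into the Carbon-aware optimizer created by the
* CodeGenerateFactory.
*/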
def optimizer(optimizer: Optimizer, conf: CarbonSQLConf, version: String): Optimizer = {
CodeGenerateFactory.getInstance().optimizerFactory.createOptimizer(optimizer, conf)
}
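/**
* Runs the wrapped Catalyst optimizer and, when the plan references carbon relations,
* applies the ResolveCarbonFunctions rule on the optimized plan to add dictionary decoders.
*/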
def execute(plan: LogicalPlan, optimizer: Optimizer): LogicalPlan = {
val executedPlan: LogicalPlan = optimizer.execute(plan)
val relations = CarbonOptimizer.collectCarbonRelation(plan)
if (relations.nonEmpty) {
new ResolveCarbonFunctions(relations).apply(executedPlan)
} else {
executedPlan
}
}
// Collect the carbon relations from the plan.
def collectCarbonRelation(plan: LogicalPlan): Seq[CarbonDecoderRelation] = {
plan collect {
case l: LogicalRelation if l.relation.isInstanceOf[CarbonDatasourceRelation] =>
CarbonDecoderRelation(l.attributeMap, l.relation.asInstanceOf[CarbonDatasourceRelation])
}
}
}
/**
* It does two jobs: 1. changes the datatype of dictionary encoded columns, and 2. adds the
* dictionary decoder plan.
*/
class ResolveCarbonFunctions(relations: Seq[CarbonDecoderRelation])
extends Rule[LogicalPlan] with PredicateHelper {
val LOGGER = LogServiceFactory.getLogService(this.getClass.getName)
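/**
* Applies the rule only when carbon relations are present and the plan has not already been
* optimized (i.e. it does not yet contain carbon decoders).
*/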
def apply(logicalPlan: LogicalPlan): LogicalPlan = {
if (relations.nonEmpty && !isOptimized(logicalPlan)) {
val plan = processPlan(logicalPlan)
val udfTransformedPlan = pushDownUDFToJoinLeftRelation(plan)
LOGGER.info("Starting to optimize plan")
val recorder = CarbonTimeStatisticsFactory.createExecutorRecorder("")
val queryStatistic = new QueryStatistic()
val result = transformCarbonPlan(udfTransformedPlan, relations)
queryStatistic.addStatistics("Time taken for Carbon Optimizer to optimize: ",
System.currentTimeMillis)
recorder.recordStatistics(queryStatistic)
recorder.logStatistics()
result
} else {
LOGGER.info("Skip CarbonOptimizer")
logicalPlan
}
}
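/**
* Rewrites ProjectForUpdate plans into ProjectForUpdateCommand: validates that every update
* column exists in the destination projection and replaces those columns with the source
* expressions of the inner Project.
*/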
private def processPlan(plan: LogicalPlan): LogicalPlan = {
plan transform {
case ProjectForUpdate(table, cols, Seq(updatePlan)) =>
var isTransformed = false
val newPlan = updatePlan transform {
case Project(pList, child) if (!isTransformed) =>
val (dest: Seq[NamedExpression], source: Seq[NamedExpression]) = pList
.splitAt(pList.size - cols.size)
val diff = cols.diff(dest.map(_.name))
if (diff.size > 0) {
sys.error(s"Unknown column(s) ${diff.mkString(",")} in table ${table.tableName}")
}
isTransformed = true
Project(dest.filter(a => !cols.contains(a.name)) ++ source, child)
}
ProjectForUpdateCommand(newPlan, table.tableIdentifier)
}
}
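/**
* For a Project over a Join, pushes the implicit positionId/tupleId UDF aliases into the
* projection of the left child and keeps plain attribute references (with the same exprIds)
* in the outer project list.
*/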
private def pushDownUDFToJoinLeftRelation(plan: LogicalPlan): LogicalPlan = {
val output = plan match {
case proj@Project(cols, Join(
left, right, jointype: org.apache.spark.sql.catalyst.plans.JoinType, condition)) =>
var projectionToBeAdded: Seq[org.apache.spark.sql.catalyst.expressions.Alias] = Seq.empty
val newCols = cols.map { col =>
col match {
case a@Alias(s: ScalaUDF, name)
if (name.equalsIgnoreCase(CarbonCommonConstants.POSITION_ID) ||
name.equalsIgnoreCase(
CarbonCommonConstants.CARBON_IMPLICIT_COLUMN_TUPLEID)) =>
projectionToBeAdded :+= a
AttributeReference(name, StringType, true)().withExprId(a.exprId)
case other => other
}
}
val newLeft = left match {
case Project(columns, logicalPlan) =>
Project(columns ++ projectionToBeAdded, logicalPlan)
case filter: Filter =>
Project(filter.output ++ projectionToBeAdded, filter)
case other => other
}
Project(newCols, Join(newLeft, right, jointype, condition))
case other => other
}
output
}
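/**
* Returns true when the plan already contains a carbon dictionary decoder or an
* InsertIntoCarbonTable node, in which case this rule is skipped.
*/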
def isOptimized(plan: LogicalPlan): Boolean = {
plan find {
case cd: CarbonDictionaryCatalystDecoder => true
case ic: InsertIntoCarbonTable => true
case other => false
} isDefined
}
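/** Tracks whether a sub-plan contains a carbon relation. */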
case class ExtraNodeInfo(var hasCarbonRelation: Boolean)
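/**
* Walks the plan bottom-up and records an ExtraNodeInfo entry for every sub-plan that contains
* no carbon relation, so those sub-plans can be skipped when adding decoders.
*/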
def fillNodeInfo(
plan: LogicalPlan,
extraNodeInfos: java.util.HashMap[LogicalPlan, ExtraNodeInfo]): ExtraNodeInfo = {
plan match {
case l: LogicalRelation if l.relation.isInstanceOf[CarbonDatasourceRelation] =>
val extraNodeInfo = ExtraNodeInfo(true)
extraNodeInfo
case others =>
val extraNodeInfo = ExtraNodeInfo(false)
others.children.foreach { childPlan =>
val childExtraNodeInfo = fillNodeInfo(childPlan, extraNodeInfos)
if (childExtraNodeInfo.hasCarbonRelation) {
extraNodeInfo.hasCarbonRelation = true
}
}
// only record sub-plans that contain no carbon relation
if (!extraNodeInfo.hasCarbonRelation) {
extraNodeInfos.put(plan, extraNodeInfo)
}
extraNodeInfo
}
}
/**
* Steps for changing the plan.
* 1. It finds out the join condition columns and dimension aggregate columns which need to
* be decoded just before that plan executes.
* 2. It transforms the plan by adding decoders where the decoded data is needed, e.g. dimension
* aggregate column decoders under aggregators and join condition decoders under the join
* children.
*/
def transformCarbonPlan(plan: LogicalPlan,
relations: Seq[CarbonDecoderRelation]): LogicalPlan = {
if (plan.isInstanceOf[RunnableCommand]) {
return plan
}
var decoder = false
val mapOfNonCarbonPlanNodes = new java.util.HashMap[LogicalPlan, ExtraNodeInfo]
fillNodeInfo(plan, mapOfNonCarbonPlanNodes)
val aliasMap = CarbonAliasDecoderRelation()
// collect alias information beforehand.
collectInformationOnAttributes(plan, aliasMap)
def hasCarbonRelation(currentPlan: LogicalPlan): Boolean = {
val extraNodeInfo = mapOfNonCarbonPlanNodes.get(currentPlan)
if (extraNodeInfo == null) {
true
} else {
extraNodeInfo.hasCarbonRelation
}
}
val attrMap = new util.HashMap[AttributeReferenceWrapper, CarbonDecoderRelation]()
relations.foreach(_.fillAttributeMap(attrMap))
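// Adds CarbonDictionaryTempDecoder nodes above the children of the current node for every
// dictionary encoded attribute that must be decoded before the node executes; the first
// decoder created during the traversal is marked as the outer decoder.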
def addTempDecoder(currentPlan: LogicalPlan): LogicalPlan = {
def transformAggregateExpression(agg: Aggregate,
aggonGroups: util.HashSet[AttributeReferenceWrapper] = null): LogicalPlan = {
val attrsOndimAggs = new util.HashSet[AttributeReferenceWrapper]
if (aggonGroups != null) {
attrsOndimAggs.addAll(aggonGroups)
}
agg.aggregateExpressions.map {
case attr: AttributeReference =>
case a@Alias(attr: AttributeReference, name) =>
case aggExp: AggregateExpression =>
aggExp.transform {
case aggExp: AggregateExpression =>
collectDimensionAggregates(aggExp, attrsOndimAggs, aliasMap, attrMap)
aggExp
}
case others =>
others.collect {
case attr: AttributeReference
if isDictionaryEncoded(attr, attrMap, aliasMap) =>
attrsOndimAggs.add(AttributeReferenceWrapper(aliasMap.getOrElse(attr, attr)))
}
}
var child = agg.child
// In case the child is also an aggregate, push the decoder down to the child
if (attrsOndimAggs.size() > 0 && !child.equals(agg)) {
child = CarbonDictionaryTempDecoder(attrsOndimAggs,
new util.HashSet[AttributeReferenceWrapper](),
agg.child)
}
if (!decoder && aggonGroups == null) {
decoder = true
CarbonDictionaryTempDecoder(new util.HashSet[AttributeReferenceWrapper](),
new util.HashSet[AttributeReferenceWrapper](),
Aggregate(agg.groupingExpressions, agg.aggregateExpressions, child),
isOuter = true)
} else {
Aggregate(agg.groupingExpressions, agg.aggregateExpressions, child)
}
}
currentPlan match {
case limit@Limit(_, child: Sort) =>
if (!decoder) {
decoder = true
CarbonDictionaryTempDecoder(new util.HashSet[AttributeReferenceWrapper](),
new util.HashSet[AttributeReferenceWrapper](),
limit,
isOuter = true)
} else {
limit
}
case sort: Sort if !sort.child.isInstanceOf[CarbonDictionaryTempDecoder] =>
val attrsOnSort = new util.HashSet[AttributeReferenceWrapper]()
sort.order.map { s =>
s.collect {
case attr: AttributeReference
if isDictionaryEncoded(attr, attrMap, aliasMap) =>
attrsOnSort.add(AttributeReferenceWrapper(aliasMap.getOrElse(attr, attr)))
}
}
var child = sort.child
if (attrsOnSort.size() > 0 && !child.isInstanceOf[Sort]) {
child = CarbonDictionaryTempDecoder(attrsOnSort,
new util.HashSet[AttributeReferenceWrapper](), sort.child)
}
if (!decoder) {
decoder = true
CarbonDictionaryTempDecoder(new util.HashSet[AttributeReferenceWrapper](),
new util.HashSet[AttributeReferenceWrapper](),
Sort(sort.order, sort.global, child),
isOuter = true)
} else {
Sort(sort.order, sort.global, child)
}
case union: Union
if !(union.left.isInstanceOf[CarbonDictionaryTempDecoder] ||
union.right.isInstanceOf[CarbonDictionaryTempDecoder]) =>
val leftCondAttrs = new util.HashSet[AttributeReferenceWrapper]
val rightCondAttrs = new util.HashSet[AttributeReferenceWrapper]
val leftLocalAliasMap = CarbonAliasDecoderRelation()
val rightLocalAliasMap = CarbonAliasDecoderRelation()
// Collect alias information for each child plan again. This is required because the global
// alias map may contain duplicates when the same aliases are reused.
collectInformationOnAttributes(union.left, leftLocalAliasMap)
collectInformationOnAttributes(union.right, rightLocalAliasMap)
union.left.output.foreach { attr =>
if (isDictionaryEncoded(attr, attrMap, leftLocalAliasMap)) {
leftCondAttrs.add(AttributeReferenceWrapper(leftLocalAliasMap.getOrElse(attr, attr)))
}
}
union.right.output.foreach { attr =>
if (isDictionaryEncoded(attr, attrMap, rightLocalAliasMap)) {
rightCondAttrs.add(
AttributeReferenceWrapper(rightLocalAliasMap.getOrElse(attr, attr)))
}
}
var leftPlan = union.left
var rightPlan = union.right
if (hasCarbonRelation(leftPlan) && leftCondAttrs.size() > 0 &&
!leftPlan.isInstanceOf[CarbonDictionaryCatalystDecoder]) {
leftPlan = CarbonDictionaryTempDecoder(leftCondAttrs,
new util.HashSet[AttributeReferenceWrapper](),
union.left, isOuter = false, Some(leftLocalAliasMap))
}
if (hasCarbonRelation(rightPlan) && rightCondAttrs.size() > 0 &&
!rightPlan.isInstanceOf[CarbonDictionaryCatalystDecoder]) {
rightPlan = CarbonDictionaryTempDecoder(rightCondAttrs,
new util.HashSet[AttributeReferenceWrapper](),
union.right, isOuter = false, Some(rightLocalAliasMap))
}
if (!decoder) {
decoder = true
CarbonDictionaryTempDecoder(new util.HashSet[AttributeReferenceWrapper](),
new util.HashSet[AttributeReferenceWrapper](),
Union(leftPlan, rightPlan),
isOuter = true)
} else {
Union(leftPlan, rightPlan)
}
case agg: Aggregate if !agg.child.isInstanceOf[CarbonDictionaryTempDecoder] =>
transformAggregateExpression(agg)
case expand: Expand if !expand.child.isInstanceOf[CarbonDictionaryTempDecoder] =>
val attrsOnExpand = new util.HashSet[AttributeReferenceWrapper]
expand.projections.map {s =>
s.map {
case attr: AttributeReference =>
case a@Alias(attr: AttributeReference, name) =>
case others =>
others.collect {
case attr: AttributeReference
if isDictionaryEncoded(attr, attrMap, aliasMap) =>
attrsOnExpand.add(AttributeReferenceWrapper(aliasMap.getOrElse(attr, attr)))
}
}
}
var child = expand.child
if (attrsOnExpand.size() > 0 && !child.isInstanceOf[Expand]) {
child = CarbonDictionaryTempDecoder(attrsOnExpand,
new util.HashSet[AttributeReferenceWrapper](),
expand.child)
}
if (!decoder) {
decoder = true
CarbonDictionaryTempDecoder(new util.HashSet[AttributeReferenceWrapper](),
new util.HashSet[AttributeReferenceWrapper](),
CodeGenerateFactory.getInstance().expandFactory.createExpand(expand, child),
isOuter = true)
} else {
CodeGenerateFactory.getInstance().expandFactory.createExpand(expand, child)
}
case filter: Filter if !filter.child.isInstanceOf[CarbonDictionaryTempDecoder] =>
val attrsOnConds = new util.HashSet[AttributeReferenceWrapper]
// If the child is a join (or sort) the filters cannot be pushed down, so decode them earlier
if (filter.child.isInstanceOf[Join] || filter.child.isInstanceOf[Sort]) {
filter.condition.collect {
case attr: AttributeReference =>
attrsOnConds.add(AttributeReferenceWrapper(aliasMap.getOrElse(attr, attr)))
}
} else {
CarbonFilters
.selectFilters(splitConjunctivePredicates(filter.condition), attrsOnConds, aliasMap)
}
var child = filter.child
if (attrsOnConds.size() > 0 && !child.isInstanceOf[Filter]) {
child = CarbonDictionaryTempDecoder(attrsOnConds,
new util.HashSet[AttributeReferenceWrapper](),
filter.child)
}
if (!decoder) {
decoder = true
CarbonDictionaryTempDecoder(new util.HashSet[AttributeReferenceWrapper](),
new util.HashSet[AttributeReferenceWrapper](),
Filter(filter.condition, child),
isOuter = true)
} else {
Filter(filter.condition, child)
}
case j: Join
if !(j.left.isInstanceOf[CarbonDictionaryTempDecoder] ||
j.right.isInstanceOf[CarbonDictionaryTempDecoder]) =>
val attrsOnJoin = new util.HashSet[Attribute]
j.condition match {
case Some(expression) =>
expression.collect {
case attr: AttributeReference
if isDictionaryEncoded(attr, attrMap, aliasMap) =>
attrsOnJoin.add(aliasMap.getOrElse(attr, attr))
}
case _ =>
}
val leftCondAttrs = new util.HashSet[AttributeReferenceWrapper]
val rightCondAttrs = new util.HashSet[AttributeReferenceWrapper]
if (attrsOnJoin.size() > 0) {
attrsOnJoin.asScala.map { attr =>
if (qualifierPresence(j.left, attr)) {
leftCondAttrs.add(AttributeReferenceWrapper(attr))
}
if (qualifierPresence(j.right, attr)) {
rightCondAttrs.add(AttributeReferenceWrapper(attr))
}
}
var leftPlan = j.left
var rightPlan = j.right
if (leftCondAttrs.size() > 0 &&
!leftPlan.isInstanceOf[CarbonDictionaryCatalystDecoder]) {
leftPlan = leftPlan match {
case agg: Aggregate =>
CarbonDictionaryTempDecoder(leftCondAttrs,
new util.HashSet[AttributeReferenceWrapper](),
transformAggregateExpression(agg, leftCondAttrs))
case _ =>
CarbonDictionaryTempDecoder(leftCondAttrs,
new util.HashSet[AttributeReferenceWrapper](),
j.left)
}
}
if (rightCondAttrs.size() > 0 &&
!rightPlan.isInstanceOf[CarbonDictionaryCatalystDecoder]) {
rightPlan = rightPlan match {
case agg: Aggregate =>
CarbonDictionaryTempDecoder(rightCondAttrs,
new util.HashSet[AttributeReferenceWrapper](),
transformAggregateExpression(agg, rightCondAttrs))
case _ =>
CarbonDictionaryTempDecoder(rightCondAttrs,
new util.HashSet[AttributeReferenceWrapper](),
j.right)
}
}
if (!decoder) {
decoder = true
CarbonDictionaryTempDecoder(new util.HashSet[AttributeReferenceWrapper](),
new util.HashSet[AttributeReferenceWrapper](),
Join(leftPlan, rightPlan, j.joinType, j.condition),
isOuter = true)
} else {
Join(leftPlan, rightPlan, j.joinType, j.condition)
}
} else {
j
}
case p: Project
if relations.nonEmpty && !p.child.isInstanceOf[CarbonDictionaryTempDecoder] =>
val attrsOnProjects = new util.HashSet[AttributeReferenceWrapper]
p.projectList.map {
case attr: AttributeReference =>
case a@Alias(attr: AttributeReference, name) =>
case others =>
others.collect {
case attr: AttributeReference
if isDictionaryEncoded(attr, attrMap, aliasMap) =>
attrsOnProjects.add(AttributeReferenceWrapper(aliasMap.getOrElse(attr, attr)))
}
}
var child = p.child
if (attrsOnProjects.size() > 0 && !child.isInstanceOf[Project]) {
child = CarbonDictionaryTempDecoder(attrsOnProjects,
new util.HashSet[AttributeReferenceWrapper](),
p.child)
}
if (!decoder) {
decoder = true
CarbonDictionaryTempDecoder(new util.HashSet[AttributeReferenceWrapper](),
new util.HashSet[AttributeReferenceWrapper](),
Project(p.projectList, child),
isOuter = true)
} else {
Project(p.projectList, child)
}
case wd: Window if !wd.child.isInstanceOf[CarbonDictionaryTempDecoder] =>
val attrsOnProjects = new util.HashSet[AttributeReferenceWrapper]
wd.projectList.map {
case attr: AttributeReference =>
case others =>
others.collect {
case attr: AttributeReference
if isDictionaryEncoded(attr, attrMap, aliasMap) =>
attrsOnProjects.add(AttributeReferenceWrapper(aliasMap.getOrElse(attr, attr)))
}
}
wd.windowExpressions.map { others =>
others.collect {
case attr: AttributeReference
if isDictionaryEncoded(attr, attrMap, aliasMap) =>
attrsOnProjects.add(AttributeReferenceWrapper(aliasMap.getOrElse(attr, attr)))
}
}
wd.partitionSpec.map{
case attr: AttributeReference =>
case others =>
others.collect {
case attr: AttributeReference
if isDictionaryEncoded(attr, attrMap, aliasMap) =>
attrsOnProjects.add(AttributeReferenceWrapper(aliasMap.getOrElse(attr, attr)))
}
}
wd.orderSpec.map { s =>
s.collect {
case attr: AttributeReference
if isDictionaryEncoded(attr, attrMap, aliasMap) =>
attrsOnProjects.add(AttributeReferenceWrapper(aliasMap.getOrElse(attr, attr)))
}
}
wd.partitionSpec.map { s =>
s.collect {
case attr: AttributeReference
if isDictionaryEncoded(attr, attrMap, aliasMap) =>
attrsOnProjects.add(AttributeReferenceWrapper(aliasMap.getOrElse(attr, attr)))
}
}
var child = wd.child
if (attrsOnProjects.size() > 0 && !child.isInstanceOf[Project]) {
child = CarbonDictionaryTempDecoder(attrsOnProjects,
new util.HashSet[AttributeReferenceWrapper](),
wd.child)
}
if (!decoder) {
decoder = true
CarbonDictionaryTempDecoder(new util.HashSet[AttributeReferenceWrapper](),
new util.HashSet[AttributeReferenceWrapper](),
Window(wd.projectList, wd.windowExpressions, wd.partitionSpec, wd.orderSpec, child),
isOuter = true)
} else {
Window(wd.projectList, wd.windowExpressions, wd.partitionSpec, wd.orderSpec, child)
}
case l: LogicalRelation if l.relation.isInstanceOf[CarbonDatasourceRelation] =>
if (!decoder) {
decoder = true
CarbonDictionaryTempDecoder(new util.HashSet[AttributeReferenceWrapper](),
new util.HashSet[AttributeReferenceWrapper](), l, isOuter = true)
} else {
l
}
case others => others
}
}
val transFormedPlan =
plan transformDown {
case cd: CarbonDictionaryTempDecoder if cd.isOuter =>
decoder = true
cd
case currentPlan =>
if (hasCarbonRelation(currentPlan)) {
addTempDecoder(currentPlan)
} else {
currentPlan
}
}
val processor = new CarbonDecoderProcessor
processor.updateDecoders(processor.getDecoderList(transFormedPlan))
updateProjection(updateTempDecoder(transFormedPlan, aliasMap, attrMap))
}
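/**
* Converts the temporary decoders into CarbonDictionaryCatalystDecoder nodes with
* include/exclude profiles and rewrites dictionary encoded attribute references in the
* remaining operators to IntegerType via updateDataType.
*/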
private def updateTempDecoder(plan: LogicalPlan,
aliasMapOriginal: CarbonAliasDecoderRelation,
attrMap: java.util.HashMap[AttributeReferenceWrapper, CarbonDecoderRelation]):
LogicalPlan = {
var allAttrsNotDecode: util.Set[AttributeReferenceWrapper] =
new util.HashSet[AttributeReferenceWrapper]()
val marker = new CarbonPlanMarker
var aliasMap = aliasMapOriginal
plan transformDown {
case cd: CarbonDictionaryTempDecoder if !cd.processed =>
cd.processed = true
allAttrsNotDecode = cd.attrsNotDecode
aliasMap = cd.aliasMap.getOrElse(aliasMap)
marker.pushMarker(allAttrsNotDecode)
if (cd.isOuter) {
CarbonDictionaryCatalystDecoder(relations,
ExcludeProfile(cd.getAttrsNotDecode.asScala.toSeq),
aliasMap,
isOuter = true,
cd.child)
} else {
CarbonDictionaryCatalystDecoder(relations,
IncludeProfile(cd.getAttrList.asScala.toSeq),
aliasMap,
isOuter = false,
cd.child)
}
case cd: CarbonDictionaryCatalystDecoder =>
cd
case sort: Sort =>
val sortExprs = sort.order.map { s =>
s.transform {
case attr: AttributeReference =>
updateDataType(attr, attrMap, allAttrsNotDecode, aliasMap)
}.asInstanceOf[SortOrder]
}
Sort(sortExprs, sort.global, sort.child)
case agg: Aggregate if !agg.child.isInstanceOf[CarbonDictionaryCatalystDecoder] =>
val aggExps = agg.aggregateExpressions.map { aggExp =>
aggExp.transform {
case attr: AttributeReference =>
updateDataType(attr, attrMap, allAttrsNotDecode, aliasMap)
}
}.asInstanceOf[Seq[NamedExpression]]
val grpExps = agg.groupingExpressions.map { gexp =>
gexp.transform {
case attr: AttributeReference =>
updateDataType(attr, attrMap, allAttrsNotDecode, aliasMap)
}
}
Aggregate(grpExps, aggExps, agg.child)
case expand: Expand =>
expand.transformExpressions {
case attr: AttributeReference =>
updateDataType(attr, attrMap, allAttrsNotDecode, aliasMap)
}
case filter: Filter =>
val filterExps = filter.condition transform {
case attr: AttributeReference =>
updateDataType(attr, attrMap, allAttrsNotDecode, aliasMap)
}
Filter(filterExps, filter.child)
case j: Join =>
marker.pushBinaryMarker(allAttrsNotDecode)
j
case u: Union =>
marker.pushBinaryMarker(allAttrsNotDecode)
u
case p: Project if relations.nonEmpty =>
val prExps = p.projectList.map { prExp =>
prExp.transform {
case attr: AttributeReference =>
updateDataType(attr, attrMap, allAttrsNotDecode, aliasMap)
}
}.asInstanceOf[Seq[NamedExpression]]
Project(prExps, p.child)
case wd: Window if relations.nonEmpty =>
val prExps = wd.projectList.map { prExp =>
prExp.transform {
case attr: AttributeReference =>
updateDataType(attr, attrMap, allAttrsNotDecode, aliasMap)
}
}.asInstanceOf[Seq[Attribute]]
val wdExps = wd.windowExpressions.map { gexp =>
gexp.transform {
case attr: AttributeReference =>
updateDataType(attr, attrMap, allAttrsNotDecode, aliasMap)
}
}.asInstanceOf[Seq[NamedExpression]]
val partitionSpec = wd.partitionSpec.map{ exp =>
exp.transform {
case attr: AttributeReference =>
updateDataType(attr, attrMap, allAttrsNotDecode, aliasMap)
}
}
val orderSpec = wd.orderSpec.map { exp =>
exp.transform {
case attr: AttributeReference =>
updateDataType(attr, attrMap, allAttrsNotDecode, aliasMap)
}
}.asInstanceOf[Seq[SortOrder]]
Window(prExps, wdExps, partitionSpec, orderSpec, wd.child)
case l: LogicalRelation if l.relation.isInstanceOf[CarbonDatasourceRelation] =>
allAttrsNotDecode = marker.revokeJoin()
l
case others => others
}
}
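/**
* Removes decoders that are not needed between Project/Filter nodes and their children, drops
* decoders with an empty include profile, and wraps non-deterministic expressions in
* CustomDeterministicExpression.
*/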
private def updateProjection(plan: LogicalPlan): LogicalPlan = {
val transFormedPlan = plan transform {
case p@Project(projectList: Seq[NamedExpression], cd: CarbonDictionaryCatalystDecoder) =>
if (cd.child.isInstanceOf[Filter] || cd.child.isInstanceOf[LogicalRelation]) {
Project(projectList: Seq[NamedExpression], cd.child)
} else {
p
}
case f@Filter(condition: Expression, cd: CarbonDictionaryCatalystDecoder) =>
if (cd.child.isInstanceOf[Project] || cd.child.isInstanceOf[LogicalRelation]) {
Filter(condition, cd.child)
} else {
f
}
}
// Remove unnecessary decoders
val finalPlan = transFormedPlan transform {
case CarbonDictionaryCatalystDecoder(_, profile, _, false, child)
if profile.isInstanceOf[IncludeProfile] && profile.isEmpty =>
child
}
val updateDtrFn = finalPlan transform {
case p@Project(projectList: Seq[NamedExpression], cd) =>
if (cd.isInstanceOf[Filter] || cd.isInstanceOf[LogicalRelation]) {
p.transformAllExpressions {
case a@Alias(exp, _)
if !exp.deterministic && !exp.isInstanceOf[CustomDeterministicExpression] =>
Alias(CustomDeterministicExpression(exp), a.name)(a.exprId, a.qualifiers,
a.explicitMetadata)
case exp: NamedExpression
if !exp.deterministic && !exp.isInstanceOf[CustomDeterministicExpression] =>
CustomDeterministicExpression(exp)
}
} else {
p
}
case f@Filter(condition: Expression, cd) =>
if (cd.isInstanceOf[Project] || cd.isInstanceOf[LogicalRelation]) {
f.transformAllExpressions {
case a@Alias(exp, _)
if !exp.deterministic && !exp.isInstanceOf[CustomDeterministicExpression] =>
Alias(CustomDeterministicExpression(exp), a.name)(a.exprId, a.qualifiers,
a.explicitMetadata)
case exp: NamedExpression
if !exp.deterministic && !exp.isInstanceOf[CustomDeterministicExpression] =>
CustomDeterministicExpression(exp)
}
} else {
f
}
}
updateDtrFn
}
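/**
* Records alias-to-attribute mappings from all expressions in the plan and additionally maps
* the output attributes of Expand nodes to the attributes used in their projections.
*/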
private def collectInformationOnAttributes(plan: LogicalPlan,
aliasMap: CarbonAliasDecoderRelation) {
plan transformAllExpressions {
case a@Alias(exp, name) =>
exp match {
case attr: Attribute => aliasMap.put(a.toAttribute, attr)
case _ => aliasMap.put(a.toAttribute, AttributeReference("", StringType)())
}
a
}
// Collect the output of Expand and register its projection attributes as aliases of that output.
plan.collect {
case expand: Expand =>
expand.projections.foreach {s =>
s.zipWithIndex.foreach { f =>
f._1 match {
case attr: AttributeReference =>
aliasMap.put(expand.output(f._2).toAttribute, attr)
case a@Alias(attr: AttributeReference, name) =>
aliasMap.put(expand.output(f._2).toAttribute, attr)
case others =>
}
}
}
}
}
// Collect aggregates on dimension columns so that decoders can be added for them.
private def collectDimensionAggregates(aggExp: AggregateExpression,
attrsOndimAggs: util.HashSet[AttributeReferenceWrapper],
aliasMap: CarbonAliasDecoderRelation,
attrMap: java.util.HashMap[AttributeReferenceWrapper, CarbonDecoderRelation]) {
aggExp collect {
case attr: AttributeReference if isDictionaryEncoded(attr, attrMap, aliasMap) =>
attrsOndimAggs.add(AttributeReferenceWrapper(aliasMap.getOrElse(attr, attr)))
}
}
/**
* Updates the attribute datatype to [IntegerType] when the carbon column is dictionary
* encoded and the attribute is not excluded from decoding.
*
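* For example (illustrative): a dictionary encoded attribute `name: StringType` is rewritten
* as `name: IntegerType` with the same exprId, so downstream operators work on the dictionary
* surrogate key values.
*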
*/
private def updateDataType(attr: Attribute,
attrMap: java.util.HashMap[AttributeReferenceWrapper, CarbonDecoderRelation],
allAttrsNotDecode: java.util.Set[AttributeReferenceWrapper],
aliasMap: CarbonAliasDecoderRelation): Attribute = {
val uAttr = aliasMap.getOrElse(attr, attr)
val relation = Option(attrMap.get(AttributeReferenceWrapper(uAttr)))
if (relation.isDefined) {
relation.get.dictionaryMap.get(uAttr.name) match {
case Some(true)
if !allAttrsNotDecode.contains(AttributeReferenceWrapper(uAttr)) =>
val newAttr = AttributeReference(attr.name,
IntegerType,
attr.nullable,
attr.metadata)(attr.exprId, attr.qualifiers)
newAttr
case _ => attr
}
} else {
attr
}
}
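/**
* Returns true when the attribute (after alias resolution) belongs to a carbon relation and
* its column is dictionary encoded.
*/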
private def isDictionaryEncoded(attr: Attribute,
attrMap: java.util.HashMap[AttributeReferenceWrapper, CarbonDecoderRelation],
aliasMap: CarbonAliasDecoderRelation): Boolean = {
val uAttr = aliasMap.getOrElse(attr, attr)
val relation = Option(attrMap.get(AttributeReferenceWrapper(uAttr)))
if (relation.isDefined) {
relation.get.dictionaryMap.get(uAttr.name) match {
case Some(true) => true
case _ => false
}
} else {
false
}
}
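/**
* Returns true if the attribute appears in the attribute map of any LogicalRelation under
* the given plan.
*/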
def qualifierPresence(plan: LogicalPlan, attr: Attribute): Boolean = {
var present = false
plan collect {
case l: LogicalRelation if l.attributeMap.contains(attr) =>
present = true
}
present
}
}
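/**
* Holds a carbon datasource relation together with its attribute map and any extra attributes
* added later, so that attributes can be matched back to the relation and its dictionary
* metadata.
*/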
case class CarbonDecoderRelation(
attributeMap: AttributeMap[AttributeReference],
carbonRelation: CarbonDatasourceRelation) {
val extraAttrs = new ArrayBuffer[Attribute]()
def addAttribute(attr: Attribute): Unit = {
extraAttrs += attr
}
def contains(attr: Attribute): Boolean = {
val exists =
attributeMap.exists(entry => entry._1.name.equalsIgnoreCase(attr.name) &&
entry._1.exprId.equals(attr.exprId)) ||
extraAttrs.exists(entry => entry.name.equalsIgnoreCase(attr.name) &&
entry.exprId.equals(attr.exprId))
exists
}
def fillAttributeMap(attrMap: java.util.HashMap[AttributeReferenceWrapper,
CarbonDecoderRelation]): Unit = {
attributeMap.foreach { attr =>
attrMap.put(AttributeReferenceWrapper(attr._1), this)
}
}
lazy val dictionaryMap = carbonRelation.carbonRelation.metaData.dictionaryMap
}