/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.carbondata.spark.testsuite.datacompaction

import org.scalatest.BeforeAndAfterAll

import org.apache.spark.sql.test.util.QueryTest

import org.apache.carbondata.core.constants.CarbonCommonConstants
import org.apache.carbondata.core.util.CarbonProperties

/**
 * Functional test (FT) for the data compaction scenario across blocklet boundaries.
 */
class DataCompactionBlockletBoundryTest extends QueryTest with BeforeAndAfterAll {

  override def beforeAll {
    sql("drop table if exists blocklettest")
    sql("drop table if exists Carbon_automation_hive")
    CarbonProperties.getInstance()
      .addProperty(CarbonCommonConstants.CARBON_TIMESTAMP_FORMAT, "mm/dd/yyyy")
    CarbonProperties.getInstance()
      .addProperty(CarbonCommonConstants.BLOCKLET_SIZE, "125")
    sql(
      "CREATE TABLE IF NOT EXISTS blocklettest (country String, ID String, date Timestamp, name " +
      "String, phonetype String, serialname String, salary Int) STORED AS carbondata"
    )
    val csvFilePath1 = s"$resourcesPath/compaction/compaction1.csv"
    // the second file loads more than 256 rows so that the column cardinality crosses the one-byte boundary.
    val csvFilePath2 = s"$resourcesPath/compaction/compactioncard2.csv"
sql("LOAD DATA LOCAL INPATH '" + csvFilePath1 + "' INTO TABLE blocklettest OPTIONS" +
"('DELIMITER'= ',', 'QUOTECHAR'= '\"')"
)
sql("LOAD DATA LOCAL INPATH '" + csvFilePath2 + "' INTO TABLE blocklettest OPTIONS" +
"('DELIMITER'= ',', 'QUOTECHAR'= '\"')"
)
    // trigger major compaction of the two loaded segments here.
    sql("alter table blocklettest compact 'major'")
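    // Create an equivalent plain Hive table and load the same data from the *_forhive copies of
    // the CSVs; it serves as the reference result set for checkAnswer in the test below.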
    sql(
      "create table Carbon_automation_hive (ID String, date " +
      "Timestamp,country String, name String, phonetype String, serialname String, salary Int ) row format " +
      "delimited fields terminated by ',' TBLPROPERTIES ('skip.header.line.count'='1') "
    )
    sql(s"LOAD DATA LOCAL INPATH '$resourcesPath/compaction/compaction1_forhive.csv" + "' INTO " +
        "table Carbon_automation_hive ")
    sql(s"LOAD DATA LOCAL INPATH '$resourcesPath/compaction/compactioncard2_forhive.csv" + "' INTO " +
        "table Carbon_automation_hive ")
  }
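
  // After the major compaction, the aggregation over the carbon table should still match the
  // result computed from the uncompacted Hive reference table.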
test("select country,count(*) as a from blocklettest")({
checkAnswer(
sql("select country,count(*) as a from blocklettest group by country"),
sql("select country,count(*) as a from Carbon_automation_hive group by country")
)
}
)
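
  // Restore the modified properties to their defaults and drop the test tables.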
  override def afterAll {
    CarbonProperties.getInstance()
      .addProperty(CarbonCommonConstants.CARBON_TIMESTAMP_FORMAT,
        CarbonCommonConstants.CARBON_TIMESTAMP_DEFAULT_FORMAT)
      .addProperty(CarbonCommonConstants.BLOCKLET_SIZE,
        "" + CarbonCommonConstants.BLOCKLET_SIZE_DEFAULT_VAL)
    sql("drop table if exists blocklettest")
    sql("drop table if exists Carbon_automation_hive")
  }
}