// .test-infra/jenkins/job_LoadTests_ParDo_Java_spark_structured_streaming.groovy - beam - Git at Google

 /*
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 import CommonTestProperties
 import CronJobBuilder
 import LoadTestsBuilder as loadTestsBuilder
 import PhraseTriggeringPostCommitBuilder
 import InfluxDBCredentialsHelper

 /*
  * Builds the four ParDo load-test definitions for the Spark Structured
  * Streaming runner.
  *
  * jobType     - interpolated into appName, bigQueryTable and influxMeasurement
  * isStreaming - stored as the `streaming` pipeline option
  * datasetName - stored as the `bigQueryDataset` pipeline option
  *
  * Returns a list of maps (title, test, runner, pipelineOptions). Each
  * pipelineOptions map also receives every entry of `additionalPipelineArgs`,
  * which is not declared here: it is read when this closure is called, so the
  * caller has to assign it beforehand.
  */
 def commonLoadTestConfig = { jobType, isStreaming, datasetName ->
   // Synthetic source shared by all scenarios: 20,000,000 records of
   // 10 + 90 bytes each. All whitespace is stripped so the JSON is compact.
   def syntheticSourceJson = """
       {
         "numRecords": 20000000,
         "keySizeBytes": 10,
         "valueSizeBytes": 90
       }
     """.trim().replaceAll("\\s", "")

   // Assembles one scenario. Only the numeric suffix, the title, the iteration
   // count and the counter-operation count differ between scenarios.
   def describeScenario = { index, scenarioTitle, iterationCount, counterOperationCount ->
     def options = [
       project                  : 'apache-beam-testing',
       appName                  : "load_tests_Java_SparkStructuredStreaming_${jobType}_ParDo_${index}",
       tempLocation             : 'gs://temp-storage-for-perf-tests/loadtests',
       publishToBigQuery        : true,
       bigQueryDataset          : datasetName,
       bigQueryTable            : "java_sparkstructuredstreaming_${jobType}_ParDo_${index}",
       influxMeasurement        : "java_${jobType}_pardo_${index}",
       publishToInfluxDB        : true,
       sourceOptions            : syntheticSourceJson,
       iterations               : iterationCount,
       numberOfCounters         : 1,
       numberOfCounterOperations: counterOperationCount,
       streaming                : isStreaming
     ]
     return [
       title          : scenarioTitle,
       test           : 'org.apache.beam.sdk.loadtests.ParDoLoadTest',
       runner         : CommonTestProperties.Runner.SPARK_STRUCTURED_STREAMING,
       pipelineOptions: options
     ]
   }

   def scenarios = [
     describeScenario(1, 'Load test: ParDo 2GB 100 byte records 10 times', 10, 0),
     describeScenario(2, 'Load test: ParDo 2GB 100 byte records 200  times', 200, 0),
     describeScenario(3, 'Load test: ParDo 2GB 100 byte records 10 counters', 1, 10),
     describeScenario(4, 'Load test: ParDo 2GB 100 byte records 100 counters', 1, 100)
   ]

   // Merge the job-specific extras last so they override any option above
   // that shares a key.
   for (scenario in scenarios) {
     scenario.pipelineOptions.putAll(additionalPipelineArgs)
   }
   return scenarios
 }


 /*
  * Defines the batch ParDo load tests on the given job scope.
  *
  * scope             - forwarded unchanged to loadTestsBuilder.loadTests
  * triggeringContext - used to look up the BigQuery dataset name
  */
 def batchLoadTestJob = { scope, triggeringContext ->
   def bigQueryDataset = loadTestsBuilder.getBigQueryDataset('load_test', triggeringContext)
   // 'batch' job type with streaming disabled.
   def testConfigurations = commonLoadTestConfig('batch', false, bigQueryDataset)
   loadTestsBuilder.loadTests(
       scope,
       CommonTestProperties.SDK.JAVA,
       testConfigurations,
       'ParDo',
       'batch')
 }


 // Scheduled variant of the batch suite. 'H 12 * * *' is passed to
 // CronJobBuilder as the schedule (in Jenkins cron syntax: once a day during
 // hour 12, at a hashed minute).
 CronJobBuilder.cronJob(
     'beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch',
     'H 12 * * *',
     this
     ) {
       // Must be assigned before batchLoadTestJob runs: commonLoadTestConfig
       // merges this map into every test's pipeline options.
       additionalPipelineArgs = [
         influxDatabase: InfluxDBCredentialsHelper.InfluxDBDatabaseName,
         influxHost    : InfluxDBCredentialsHelper.InfluxDBHostUrl
       ]
       batchLoadTestJob(delegate, CommonTestProperties.TriggeringContext.POST_COMMIT)
     }


 // Phrase-triggered variant of the batch suite, run with the PR triggering
 // context. NOTE(review): the second and third arguments look like the trigger
 // phrase and the job description; confirm against
 // PhraseTriggeringPostCommitBuilder.
 PhraseTriggeringPostCommitBuilder.postCommitJob(
   'beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch',
   'Run Load Tests Java ParDo SparkStructuredStreaming Batch',
   'Load Tests Java ParDo SparkStructuredStreaming Batch suite',
   this) {
   // No extra pipeline options here (unlike the cron job, no Influx settings),
   // but the variable must still be assigned because commonLoadTestConfig
   // reads it.
   additionalPipelineArgs = [:]
   batchLoadTestJob(delegate, CommonTestProperties.TriggeringContext.PR)
 }
	/*
	* Licensed to the Apache Software Foundation (ASF) under one
	* or more contributor license agreements. See the NOTICE file
	* distributed with this work for additional information
	* regarding copyright ownership. The ASF licenses this file
	* to you under the Apache License, Version 2.0 (the
	* "License"); you may not use this file except in compliance
	* with the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	import CommonTestProperties
	import CronJobBuilder
	import LoadTestsBuilder as loadTestsBuilder
	import PhraseTriggeringPostCommitBuilder
	import InfluxDBCredentialsHelper

	/*
	 * Produces the ParDo load-test definitions for the Spark Structured
	 * Streaming runner as a list of maps (title, test, runner, pipelineOptions).
	 *
	 * jobType     - interpolated into appName, bigQueryTable and influxMeasurement
	 * isStreaming - value of the `streaming` pipeline option
	 * datasetName - value of the `bigQueryDataset` pipeline option
	 *
	 * `additionalPipelineArgs` is not declared in this closure; it is read at
	 * call time and merged into every pipelineOptions map, so the caller must
	 * assign it first.
	 */
	def commonLoadTestConfig = { jobType, isStreaming, datasetName ->
	  // One row per scenario: [numeric suffix, title, iterations, counter operations].
	  def scenarioTable = [
	    [1, 'Load test: ParDo 2GB 100 byte records 10 times', 10, 0],
	    [2, 'Load test: ParDo 2GB 100 byte records 200 times', 200, 0],
	    [3, 'Load test: ParDo 2GB 100 byte records 10 counters', 1, 10],
	    [4, 'Load test: ParDo 2GB 100 byte records 100 counters', 1, 100]
	  ]

	  return scenarioTable.collect { row ->
	    def (suffix, scenarioTitle, iterationCount, counterOperationCount) = row

	    def scenario = [
	      title          : scenarioTitle,
	      test           : 'org.apache.beam.sdk.loadtests.ParDoLoadTest',
	      runner         : CommonTestProperties.Runner.SPARK_STRUCTURED_STREAMING,
	      pipelineOptions: [
	        project                  : 'apache-beam-testing',
	        appName                  : "load_tests_Java_SparkStructuredStreaming_${jobType}_ParDo_${suffix}",
	        tempLocation             : 'gs://temp-storage-for-perf-tests/loadtests',
	        publishToBigQuery        : true,
	        bigQueryDataset          : datasetName,
	        bigQueryTable            : "java_sparkstructuredstreaming_${jobType}_ParDo_${suffix}",
	        influxMeasurement        : "java_${jobType}_pardo_${suffix}",
	        publishToInfluxDB        : true,
	        // 20,000,000 records of 10 + 90 bytes; whitespace is stripped so
	        // the JSON is compact.
	        sourceOptions            : """
	          {
	            "numRecords": 20000000,
	            "keySizeBytes": 10,
	            "valueSizeBytes": 90
	          }
	        """.trim().replaceAll("\\s", ""),
	        iterations               : iterationCount,
	        numberOfCounters         : 1,
	        numberOfCounterOperations: counterOperationCount,
	        streaming                : isStreaming
	      ]
	    ]

	    // Job-specific extras go in last, overriding any option with the same key.
	    scenario.pipelineOptions.putAll(additionalPipelineArgs)
	    return scenario
	  }
	}


	/*
	 * Defines the batch ParDo load tests on the given job scope.
	 *
	 * scope             - handed straight to loadTestsBuilder.loadTests
	 * triggeringContext - used to resolve the BigQuery dataset name
	 */
	def batchLoadTestJob = { scope, triggeringContext ->
	  def resolvedDataset = loadTestsBuilder.getBigQueryDataset('load_test', triggeringContext)
	  // Batch flavour: job type 'batch', streaming disabled.
	  def batchConfigurations = commonLoadTestConfig('batch', false, resolvedDataset)
	  loadTestsBuilder.loadTests(scope, CommonTestProperties.SDK.JAVA, batchConfigurations, 'ParDo', 'batch')
	}


	// Scheduled run of the batch suite with the POST_COMMIT triggering context.
	// The schedule string 'H 12 * * *' is passed through to CronJobBuilder.
	CronJobBuilder.cronJob(
	  'beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch',
	  'H 12 * * *',
	  this) {
	  // Assigned before the call below because commonLoadTestConfig merges this
	  // map into each test's pipeline options.
	  additionalPipelineArgs = [
	    influxDatabase: InfluxDBCredentialsHelper.InfluxDBDatabaseName,
	    influxHost    : InfluxDBCredentialsHelper.InfluxDBHostUrl
	  ]
	  batchLoadTestJob(delegate, CommonTestProperties.TriggeringContext.POST_COMMIT)
	}


	// Phrase-triggered run of the batch suite with the PR triggering context.
	// NOTE(review): the second and third arguments appear to be the trigger
	// phrase and a description; verify against PhraseTriggeringPostCommitBuilder.
	PhraseTriggeringPostCommitBuilder.postCommitJob(
	  'beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch',
	  'Run Load Tests Java ParDo SparkStructuredStreaming Batch',
	  'Load Tests Java ParDo SparkStructuredStreaming Batch suite',
	  this
	) {
	  // Empty on purpose: no extra options for this job, but
	  // commonLoadTestConfig still reads the variable.
	  additionalPipelineArgs = [:]
	  batchLoadTestJob(delegate, CommonTestProperties.TriggeringContext.PR)
	}