blob: 2b973208d4639acf0248fa969ff5dd514ba3ce92 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
import CommonTestProperties
import CronJobBuilder
import LoadTestsBuilder as loadTestsBuilder
import PhraseTriggeringPostCommitBuilder
import InfluxDBCredentialsHelper
/**
 * Builds the ParDo load test definitions for the Spark Structured Streaming runner.
 *
 * @param jobType     label interpolated into appName, bigQueryTable and influxMeasurement
 * @param isStreaming value passed through as the `streaming` pipeline option
 * @param datasetName value passed through as the `bigQueryDataset` pipeline option
 * @return list of four test maps (title, test, runner, pipelineOptions); every
 *         pipelineOptions map additionally receives the entries of additionalPipelineArgs
 */
def commonLoadTestConfig = { jobType, isStreaming, datasetName ->
  // All scenarios read the same synthetic input: 20M records of 10 + 90 bytes each.
  // The JSON is collapsed to a single whitespace-free string.
  def syntheticSource = """
      {
        "numRecords": 20000000,
        "keySizeBytes": 10,
        "valueSizeBytes": 90
      }
    """.trim().replaceAll("\\s", "")

  // Assembles one scenario. Only the numeric suffix, the title, the iteration
  // count and the counter-operation count vary between the four tests.
  def scenario = { suffix, scenarioTitle, iterationCount, counterOperations ->
    [
      title          : scenarioTitle,
      test           : 'org.apache.beam.sdk.loadtests.ParDoLoadTest',
      runner         : CommonTestProperties.Runner.SPARK_STRUCTURED_STREAMING,
      pipelineOptions: [
        project                  : 'apache-beam-testing',
        appName                  : "load_tests_Java_SparkStructuredStreaming_${jobType}_ParDo_${suffix}",
        tempLocation             : 'gs://temp-storage-for-perf-tests/loadtests',
        publishToBigQuery        : true,
        bigQueryDataset          : datasetName,
        bigQueryTable            : "java_sparkstructuredstreaming_${jobType}_ParDo_${suffix}",
        influxMeasurement        : "java_${jobType}_pardo_${suffix}",
        publishToInfluxDB        : true,
        sourceOptions            : syntheticSource,
        iterations               : iterationCount,
        numberOfCounters         : 1,
        numberOfCounterOperations: counterOperations,
        streaming                : isStreaming
      ]
    ]
  }

  def tests = [
    scenario(1, 'Load test: ParDo 2GB 100 byte records 10 times', 10, 0),
    scenario(2, 'Load test: ParDo 2GB 100 byte records 200 times', 200, 0),
    scenario(3, 'Load test: ParDo 2GB 100 byte records 10 counters', 1, 10),
    scenario(4, 'Load test: ParDo 2GB 100 byte records 100 counters', 1, 100),
  ]

  // additionalPipelineArgs is not declared in this closure; it is assigned by the
  // job definitions before they invoke this configuration.
  for (test in tests) {
    test.pipelineOptions.putAll(additionalPipelineArgs)
  }
  tests
}
/**
 * Registers the batch ParDo load tests on the given job scope.
 *
 * @param scope             job context handed on to loadTestsBuilder.loadTests
 * @param triggeringContext CommonTestProperties.TriggeringContext value used to
 *                          look up the BigQuery dataset for 'load_test'
 */
def batchLoadTestJob = { scope, triggeringContext ->
  def bigQueryDataset = loadTestsBuilder.getBigQueryDataset('load_test', triggeringContext)
  // Batch flavour: jobType 'batch', streaming disabled.
  def batchTests = commonLoadTestConfig('batch', false, bigQueryDataset)
  loadTestsBuilder.loadTests(scope, CommonTestProperties.SDK.JAVA, batchTests, "ParDo", "batch")
}
// Scheduled variant of the batch ParDo load test job.
// NOTE(review): 'H 12 * * *' looks like a Jenkins cron spec (daily, hour 12, hashed
// minute) — confirm against CronJobBuilder.
CronJobBuilder.cronJob('beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch', 'H 12 * * *', this) {
// Assigned without `def`, so this is not a local of the closure; commonLoadTestConfig
// reads a variable of the same name and merges it into every test's pipelineOptions.
// It must therefore be set before batchLoadTestJob is called.
additionalPipelineArgs = [
influxDatabase: InfluxDBCredentialsHelper.InfluxDBDatabaseName,
influxHost: InfluxDBCredentialsHelper.InfluxDBHostUrl,
]
// Builds the tests with the POST_COMMIT triggering context.
batchLoadTestJob(delegate, CommonTestProperties.TriggeringContext.POST_COMMIT)
}
// Variant of the same job built with the PR triggering context.
// NOTE(review): the second and third arguments are presumably the trigger phrase and
// the displayed job description — confirm against PhraseTriggeringPostCommitBuilder.
PhraseTriggeringPostCommitBuilder.postCommitJob(
'beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch',
'Run Load Tests Java ParDo SparkStructuredStreaming Batch',
'Load Tests Java ParDo SparkStructuredStreaming Batch suite',
this
) {
// Empty map: no extra pipeline options (in particular no influxDatabase/influxHost)
// are merged into the tests for this variant.
// NOTE(review): the tests still set publishToInfluxDB to true — verify this is intended
// when no InfluxDB connection options are supplied.
additionalPipelineArgs = [:]
batchLoadTestJob(delegate, CommonTestProperties.TriggeringContext.PR)
}