Skip to content

Commit

Permalink
Add Load Tests Combine/ParDo SparkStructuredStreaming Batch Java work…
Browse files Browse the repository at this point in the history
…flows (#28714)

* Add Load Tests Combine/ParDo SparkStructuredStreaming Batch Java workflows

* Refactoring
  • Loading branch information
Amar3tto authored Sep 28, 2023
1 parent f824adc commit 072848f
Show file tree
Hide file tree
Showing 9 changed files with 409 additions and 0 deletions.
Original file line number Diff line number Diff line change
@@ -0,0 +1,107 @@
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Workflow that runs the Java Combine load tests on the
# SparkStructuredStreaming runner in batch mode. It can be started by the
# daily schedule, by a manual dispatch, or by an issue/PR comment containing
# exactly the trigger phrase checked in the job's `if:` below.
name: LoadTests Java Combine SparkStructuredStreaming Batch

on:
  issue_comment:
    types: [created]
  schedule:
    # Every day at 18:15 (GitHub evaluates cron schedules in UTC).
    - cron: '15 18 * * *'
  workflow_dispatch:

# Set explicit permissions for the action to avoid the default permissions,
# which are `write-all` in case of a pull_request_target event.
permissions:
  actions: write
  pull-requests: read
  checks: read
  contents: read
  deployments: read
  id-token: none
  issues: read
  discussions: read
  packages: read
  pages: read
  repository-projects: read
  security-events: read
  statuses: read

# This allows a subsequently queued workflow run to interrupt previous runs
# that resolve to the same group key.
concurrency:
  group: '${{ github.workflow }} @ ${{ github.event.issue.number || github.sha || github.head_ref || github.ref }}-${{ github.event.schedule || github.event.comment.body || github.event.sender.login }}'
  cancel-in-progress: true

env:
  GRADLE_ENTERPRISE_ACCESS_KEY: ${{ secrets.GE_ACCESS_TOKEN }}
  GRADLE_ENTERPRISE_CACHE_USERNAME: ${{ secrets.GE_CACHE_USERNAME }}
  GRADLE_ENTERPRISE_CACHE_PASSWORD: ${{ secrets.GE_CACHE_PASSWORD }}
  # Declared empty here and read by the three Gradle steps below.
  # NOTE(review): presumably overwritten by the "Prepare test arguments" step,
  # one variable per listed argument file, in order - confirm against
  # ./.github/actions/test-arguments-action.
  beam_LoadTests_Java_Combine_SparkStructuredStreaming_Batch_test_arguments_1: ''
  beam_LoadTests_Java_Combine_SparkStructuredStreaming_Batch_test_arguments_2: ''
  beam_LoadTests_Java_Combine_SparkStructuredStreaming_Batch_test_arguments_3: ''

jobs:
  beam_LoadTests_Java_Combine_SparkStructuredStreaming_Batch:
    # Run for manual and scheduled triggers; for issue_comment events run only
    # when the comment body is exactly the trigger phrase.
    if: |
      github.event_name == 'workflow_dispatch' ||
      github.event_name == 'schedule' ||
      github.event.comment.body == 'Run Load Tests Java Combine SparkStructuredStreaming Batch'
    runs-on: [self-hosted, ubuntu-20.04, main]
    # 720 minutes = 12 hours.
    timeout-minutes: 720
    name: ${{ matrix.job_name }} (${{ matrix.job_phrase }})
    strategy:
      # Single-entry matrix: used only to give the job name and the trigger
      # phrase a single definition that the steps below can reference.
      matrix:
        job_name: ["beam_LoadTests_Java_Combine_SparkStructuredStreaming_Batch"]
        job_phrase: ["Run Load Tests Java Combine SparkStructuredStreaming Batch"]
    steps:
      - uses: actions/checkout@v3
      - name: Setup repository
        uses: ./.github/actions/setup-action
        with:
          comment_phrase: ${{ matrix.job_phrase }}
          github_token: ${{ secrets.GITHUB_TOKEN }}
          github_job: ${{ matrix.job_name }} (${{ matrix.job_phrase }})
      - name: Prepare test arguments
        uses: ./.github/actions/test-arguments-action
        with:
          test-type: load
          test-language: java
          # One path per line; the order matches load tests 1, 2 and 3 below.
          argument-file-paths: |
            ${{ github.workspace }}/.github/workflows/load-tests-job-configs/java_Combine_SparkStructuredStreaming_Batch_10b.txt
            ${{ github.workspace }}/.github/workflows/load-tests-job-configs/java_Combine_SparkStructuredStreaming_Batch_Fanout_4.txt
            ${{ github.workspace }}/.github/workflows/load-tests-job-configs/java_Combine_SparkStructuredStreaming_Batch_Fanout_8.txt
      # The final line of each `arguments` block carries no trailing backslash:
      # a continuation with nothing after it would splice in whatever text the
      # consuming action places on the following line.
      - name: run Combine SparkStructuredStreaming Batch Java Load Test 1 (10b records)
        uses: ./.github/actions/gradle-command-self-hosted-action
        with:
          gradle-command: :sdks:java:testing:load-tests:run
          arguments: |
            -PloadTest.mainClass=org.apache.beam.sdk.loadtests.CombineLoadTest \
            -Prunner=:runners:spark:3 \
            '-PloadTest.args=${{ env.beam_LoadTests_Java_Combine_SparkStructuredStreaming_Batch_test_arguments_1 }}'
      - name: run Combine SparkStructuredStreaming Batch Java Load Test 2 (fanout 4)
        uses: ./.github/actions/gradle-command-self-hosted-action
        with:
          gradle-command: :sdks:java:testing:load-tests:run
          arguments: |
            -PloadTest.mainClass=org.apache.beam.sdk.loadtests.CombineLoadTest \
            -Prunner=:runners:spark:3 \
            '-PloadTest.args=${{ env.beam_LoadTests_Java_Combine_SparkStructuredStreaming_Batch_test_arguments_2 }}'
      - name: run Combine SparkStructuredStreaming Batch Java Load Test 3 (fanout 8)
        uses: ./.github/actions/gradle-command-self-hosted-action
        with:
          gradle-command: :sdks:java:testing:load-tests:run
          arguments: |
            -PloadTest.mainClass=org.apache.beam.sdk.loadtests.CombineLoadTest \
            -Prunner=:runners:spark:3 \
            '-PloadTest.args=${{ env.beam_LoadTests_Java_Combine_SparkStructuredStreaming_Batch_test_arguments_3 }}'
Original file line number Diff line number Diff line change
@@ -0,0 +1,117 @@
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Workflow that runs the Java ParDo load tests on the
# SparkStructuredStreaming runner in batch mode. It can be started by the
# daily schedule, by a manual dispatch, or by an issue/PR comment containing
# exactly the trigger phrase checked in the job's `if:` below.
name: LoadTests Java ParDo SparkStructuredStreaming Batch

on:
  issue_comment:
    types: [created]
  schedule:
    # Every day at 08:25 (GitHub evaluates cron schedules in UTC).
    - cron: '25 8 * * *'
  workflow_dispatch:

# Set explicit permissions for the action to avoid the default permissions,
# which are `write-all` in case of a pull_request_target event.
permissions:
  actions: write
  pull-requests: read
  checks: read
  contents: read
  deployments: read
  id-token: none
  issues: read
  discussions: read
  packages: read
  pages: read
  repository-projects: read
  security-events: read
  statuses: read

# This allows a subsequently queued workflow run to interrupt previous runs
# that resolve to the same group key.
concurrency:
  group: '${{ github.workflow }} @ ${{ github.event.issue.number || github.sha || github.head_ref || github.ref }}-${{ github.event.schedule || github.event.comment.body || github.event.sender.login }}'
  cancel-in-progress: true

env:
  GRADLE_ENTERPRISE_ACCESS_KEY: ${{ secrets.GE_ACCESS_TOKEN }}
  GRADLE_ENTERPRISE_CACHE_USERNAME: ${{ secrets.GE_CACHE_USERNAME }}
  GRADLE_ENTERPRISE_CACHE_PASSWORD: ${{ secrets.GE_CACHE_PASSWORD }}
  # Declared empty here and read by the four Gradle steps below.
  # NOTE(review): presumably overwritten by the "Prepare test arguments" step,
  # one variable per listed argument file, in order - confirm against
  # ./.github/actions/test-arguments-action.
  beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch_test_arguments_1: ''
  beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch_test_arguments_2: ''
  beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch_test_arguments_3: ''
  beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch_test_arguments_4: ''

jobs:
  beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch:
    # Run for manual and scheduled triggers; for issue_comment events run only
    # when the comment body is exactly the trigger phrase.
    if: |
      github.event_name == 'workflow_dispatch' ||
      github.event_name == 'schedule' ||
      github.event.comment.body == 'Run Load Tests Java ParDo SparkStructuredStreaming Batch'
    runs-on: [self-hosted, ubuntu-20.04, main]
    # 720 minutes = 12 hours.
    timeout-minutes: 720
    name: ${{ matrix.job_name }} (${{ matrix.job_phrase }})
    strategy:
      # Single-entry matrix: used only to give the job name and the trigger
      # phrase a single definition that the steps below can reference.
      matrix:
        job_name: ["beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch"]
        job_phrase: ["Run Load Tests Java ParDo SparkStructuredStreaming Batch"]
    steps:
      - uses: actions/checkout@v3
      - name: Setup repository
        uses: ./.github/actions/setup-action
        with:
          comment_phrase: ${{ matrix.job_phrase }}
          github_token: ${{ secrets.GITHUB_TOKEN }}
          github_job: ${{ matrix.job_name }} (${{ matrix.job_phrase }})
      - name: Prepare test arguments
        uses: ./.github/actions/test-arguments-action
        with:
          test-type: load
          test-language: java
          # One path per line; the order matches load tests 1 to 4 below.
          argument-file-paths: |
            ${{ github.workspace }}/.github/workflows/load-tests-job-configs/java_ParDo_SparkStructuredStreaming_Batch_10_times.txt
            ${{ github.workspace }}/.github/workflows/load-tests-job-configs/java_ParDo_SparkStructuredStreaming_Batch_200_times.txt
            ${{ github.workspace }}/.github/workflows/load-tests-job-configs/java_ParDo_SparkStructuredStreaming_Batch_10_counters.txt
            ${{ github.workspace }}/.github/workflows/load-tests-job-configs/java_ParDo_SparkStructuredStreaming_Batch_100_counters.txt
      # The final line of each `arguments` block carries no trailing backslash:
      # a continuation with nothing after it would splice in whatever text the
      # consuming action places on the following line.
      - name: run ParDo SparkStructuredStreaming Batch Java Load Test 1 (10 times)
        uses: ./.github/actions/gradle-command-self-hosted-action
        with:
          gradle-command: :sdks:java:testing:load-tests:run
          arguments: |
            -PloadTest.mainClass=org.apache.beam.sdk.loadtests.ParDoLoadTest \
            -Prunner=:runners:spark:3 \
            '-PloadTest.args=${{ env.beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch_test_arguments_1 }}'
      - name: run ParDo SparkStructuredStreaming Batch Java Load Test 2 (200 times)
        uses: ./.github/actions/gradle-command-self-hosted-action
        with:
          gradle-command: :sdks:java:testing:load-tests:run
          arguments: |
            -PloadTest.mainClass=org.apache.beam.sdk.loadtests.ParDoLoadTest \
            -Prunner=:runners:spark:3 \
            '-PloadTest.args=${{ env.beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch_test_arguments_2 }}'
      - name: run ParDo SparkStructuredStreaming Batch Java Load Test 3 (10 counters)
        uses: ./.github/actions/gradle-command-self-hosted-action
        with:
          gradle-command: :sdks:java:testing:load-tests:run
          arguments: |
            -PloadTest.mainClass=org.apache.beam.sdk.loadtests.ParDoLoadTest \
            -Prunner=:runners:spark:3 \
            '-PloadTest.args=${{ env.beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch_test_arguments_3 }}'
      - name: run ParDo SparkStructuredStreaming Batch Java Load Test 4 (100 counters)
        uses: ./.github/actions/gradle-command-self-hosted-action
        with:
          gradle-command: :sdks:java:testing:load-tests:run
          arguments: |
            -PloadTest.mainClass=org.apache.beam.sdk.loadtests.ParDoLoadTest \
            -Prunner=:runners:spark:3 \
            '-PloadTest.args=${{ env.beam_LoadTests_Java_ParDo_SparkStructuredStreaming_Batch_test_arguments_4 }}'
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Pipeline options for Combine load test 1 (batch, SparkStructuredStreamingRunner):
# 200,000,000 source records with 1-byte keys and 9-byte values, fanout 1,
# TOP_LARGEST per-key combiner with topCount 20; results are published to
# InfluxDB under the measurement java_batch_combine_1.
--appName=load_tests_Java_SparkStructuredStreaming_batch_Combine_1
--tempLocation=gs://temp-storage-for-perf-tests/loadtests
--influxMeasurement=java_batch_combine_1
--publishToInfluxDB=true
--sourceOptions={"numRecords":200000000,"keySizeBytes":1,"valueSizeBytes":9}
--fanout=1
--iterations=1
--topCount=20
--perKeyCombiner=TOP_LARGEST
--streaming=false
--runner=SparkStructuredStreamingRunner
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Pipeline options for Combine load test 2 (batch, SparkStructuredStreamingRunner):
# 5,000,000 source records with 10-byte keys and 90-byte values, fanout 4,
# TOP_LARGEST per-key combiner with topCount 20; results are published to
# InfluxDB under the measurement java_batch_combine_2.
--appName=load_tests_Java_SparkStructuredStreaming_batch_Combine_2
--tempLocation=gs://temp-storage-for-perf-tests/loadtests
--influxMeasurement=java_batch_combine_2
--publishToInfluxDB=true
--sourceOptions={"numRecords":5000000,"keySizeBytes":10,"valueSizeBytes":90}
--fanout=4
--iterations=1
--topCount=20
--perKeyCombiner=TOP_LARGEST
--streaming=false
--runner=SparkStructuredStreamingRunner
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Pipeline options for Combine load test 3 (batch, SparkStructuredStreamingRunner):
# 2,500,000 source records with 10-byte keys and 90-byte values, fanout 8,
# TOP_LARGEST per-key combiner with topCount 20; results are published to
# InfluxDB under the measurement java_batch_combine_3.
--appName=load_tests_Java_SparkStructuredStreaming_batch_Combine_3
--tempLocation=gs://temp-storage-for-perf-tests/loadtests
--influxMeasurement=java_batch_combine_3
--publishToInfluxDB=true
--sourceOptions={"numRecords":2500000,"keySizeBytes":10,"valueSizeBytes":90}
--fanout=8
--iterations=1
--topCount=20
--perKeyCombiner=TOP_LARGEST
--streaming=false
--runner=SparkStructuredStreamingRunner
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Pipeline options for ParDo load test 4 (batch, SparkStructuredStreamingRunner):
# 20,000,000 source records with 10-byte keys and 90-byte values, 1 iteration,
# 1 counter with 100 counter operations; results are published to InfluxDB
# under the measurement java_batch_pardo_4.
--appName=load_tests_Java_SparkStructuredStreaming_batch_ParDo_4
--tempLocation=gs://temp-storage-for-perf-tests/loadtests
--influxMeasurement=java_batch_pardo_4
--publishToInfluxDB=true
--sourceOptions={"numRecords":20000000,"keySizeBytes":10,"valueSizeBytes":90}
--iterations=1
--numberOfCounters=1
--numberOfCounterOperations=100
--streaming=false
--runner=SparkStructuredStreamingRunner
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Pipeline options for ParDo load test 3 (batch, SparkStructuredStreamingRunner):
# 20,000,000 source records with 10-byte keys and 90-byte values, 1 iteration,
# 1 counter with 10 counter operations; results are published to InfluxDB
# under the measurement java_batch_pardo_3.
--appName=load_tests_Java_SparkStructuredStreaming_batch_ParDo_3
--tempLocation=gs://temp-storage-for-perf-tests/loadtests
--influxMeasurement=java_batch_pardo_3
--publishToInfluxDB=true
--sourceOptions={"numRecords":20000000,"keySizeBytes":10,"valueSizeBytes":90}
--iterations=1
--numberOfCounters=1
--numberOfCounterOperations=10
--streaming=false
--runner=SparkStructuredStreamingRunner
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Pipeline options for ParDo load test 1 (batch, SparkStructuredStreamingRunner):
# 20,000,000 source records with 10-byte keys and 90-byte values, 10 iterations,
# 1 counter with 0 counter operations; results are published to InfluxDB
# under the measurement java_batch_pardo_1.
--appName=load_tests_Java_SparkStructuredStreaming_batch_ParDo_1
--tempLocation=gs://temp-storage-for-perf-tests/loadtests
--influxMeasurement=java_batch_pardo_1
--publishToInfluxDB=true
--sourceOptions={"numRecords":20000000,"keySizeBytes":10,"valueSizeBytes":90}
--iterations=10
--numberOfCounters=1
--numberOfCounterOperations=0
--streaming=false
--runner=SparkStructuredStreamingRunner
Loading

0 comments on commit 072848f

Please sign in to comment.