From 87e9ad60f636d53c0eaa8a4b51a98b1bcb2f809c Mon Sep 17 00:00:00 2001
From: aleksandr-dudko
Date: Mon, 18 Sep 2023 17:11:15 +0400
Subject: [PATCH 1/2] Add GitHub Workflow Replacements for job_PerformanceTests_BiqQueryIO_Read_Python and job_PerformanceTests_BiqQueryIO_Write_Python_Batch

---
 ...erformanceTests_BiqQueryIO_Read_Python.yml | 92 +++++++++++++++++++
 ...nceTests_BiqQueryIO_Write_Python_Batch.yml | 92 +++++++++++++++++++
 ...erformanceTests_BiqQueryIO_Read_Python.txt | 33 +++++++
 ...rformanceTests_BiqQueryIO_Write_Python.txt | 33 +++++++
 4 files changed, 250 insertions(+)
 create mode 100644 .github/workflows/beam_PerformanceTests_BiqQueryIO_Read_Python.yml
 create mode 100644 .github/workflows/beam_PerformanceTests_BiqQueryIO_Write_Python_Batch.yml
 create mode 100644 .github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Read_Python.txt
 create mode 100644 .github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Write_Python.txt

diff --git a/.github/workflows/beam_PerformanceTests_BiqQueryIO_Read_Python.yml b/.github/workflows/beam_PerformanceTests_BiqQueryIO_Read_Python.yml
new file mode 100644
index 000000000000..60821e9ea1c0
--- /dev/null
+++ b/.github/workflows/beam_PerformanceTests_BiqQueryIO_Read_Python.yml
@@ -0,0 +1,92 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+name: Performance BigQueryIO Read Python
+
+on:
+  issue_comment:
+    types: [created]
+  schedule:
+    - cron: '0 2 * * *'
+  workflow_dispatch:
+
+# Setting explicit permissions for the action to avoid the default permissions which are `write-all` in case of pull_request_target event
+permissions:
+  actions: write
+  pull-requests: write
+  checks: write
+  contents: read
+  deployments: read
+  id-token: none
+  issues: write
+  discussions: read
+  packages: read
+  pages: read
+  repository-projects: read
+  security-events: read
+  statuses: read
+
+# This allows a subsequently queued workflow run to interrupt previous runs
+concurrency:
+  group: '${{ github.workflow }} @ ${{ github.event.issue.number || github.sha || github.head_ref || github.ref }}-${{ github.event.schedule || github.event.comment.body || github.event.sender.login }}'
+  cancel-in-progress: true
+
+env:
+  GRADLE_ENTERPRISE_ACCESS_KEY: ${{ secrets.GE_ACCESS_TOKEN }}
+  GRADLE_ENTERPRISE_CACHE_USERNAME: ${{ secrets.GE_CACHE_USERNAME }}
+  GRADLE_ENTERPRISE_CACHE_PASSWORD: ${{ secrets.GE_CACHE_PASSWORD }}
+
+jobs:
+  beam_PerformanceTests_BiqQueryIO_Read_Python:
+    if: |
+      github.event_name == 'workflow_dispatch' ||
+      github.event_name == 'schedule' ||
+      github.event.comment.body == 'Run BigQueryIO Read Performance Test Python'
+    runs-on: [self-hosted, ubuntu-20.04, main]
+    timeout-minutes: 240
+    name: ${{ matrix.job_name }} (${{ matrix.job_phrase }})
+    strategy:
+      matrix:
+        job_name: ["beam_PerformanceTests_BiqQueryIO_Read_Python"]
+        job_phrase: ["Run BigQueryIO Read Performance Test Python"]
+    steps:
+      - uses: actions/checkout@v3
+      - name: Setup repository
+        uses: ./.github/actions/setup-action
+        with:
+          comment_phrase: ${{ matrix.job_phrase }}
+          github_token: ${{ secrets.GITHUB_TOKEN }}
+          github_job: ${{ matrix.job_name }} (${{ matrix.job_phrase }})
+      - name: Install Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: '3.8'
+      - name: Prepare config
+        id: set_config
+        shell: bash
+        run: |
+          CURDATE=$(date '+%m%d%H%M%S' --utc)
+          CURCONFIG=$(grep -v "^#.*" ./.github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Read_Python.txt | tr '\n' ' ')
+          CONFIGWITHDATE="${CURCONFIG/performance-tests-bqio-read-python-10gb/performance-tests-bqio-read-python-10gb$CURDATE}"
+          echo "prepared_config=$CONFIGWITHDATE" >> "$GITHUB_OUTPUT"
+      - name: run BigQueryIO Read Python Performance Test
+        uses: ./.github/actions/gradle-command-self-hosted-action
+        with:
+          gradle-command: :sdks:python:apache_beam:testing:load_tests:run
+          arguments: |
+            -PloadTest.mainClass=apache_beam.io.gcp.bigquery_read_perf_test \
+            -PpythonVersion=3.8 \
+            -Prunner=DataflowRunner \
+            '-PloadTest.args=${{steps.set_config.outputs.prepared_config}}'
diff --git a/.github/workflows/beam_PerformanceTests_BiqQueryIO_Write_Python_Batch.yml b/.github/workflows/beam_PerformanceTests_BiqQueryIO_Write_Python_Batch.yml
new file mode 100644
index 000000000000..3b8a74aae7e7
--- /dev/null
+++ b/.github/workflows/beam_PerformanceTests_BiqQueryIO_Write_Python_Batch.yml
@@ -0,0 +1,92 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+name: Performance BigQueryIO Write Python Batch
+
+on:
+  issue_comment:
+    types: [created]
+  schedule:
+    - cron: '0 1 * * *'
+  workflow_dispatch:
+
+# Setting explicit permissions for the action to avoid the default permissions which are `write-all` in case of pull_request_target event
+permissions:
+  actions: write
+  pull-requests: write
+  checks: write
+  contents: read
+  deployments: read
+  id-token: none
+  issues: write
+  discussions: read
+  packages: read
+  pages: read
+  repository-projects: read
+  security-events: read
+  statuses: read
+
+# This allows a subsequently queued workflow run to interrupt previous runs
+concurrency:
+  group: '${{ github.workflow }} @ ${{ github.event.issue.number || github.sha || github.head_ref || github.ref }}-${{ github.event.schedule || github.event.comment.body || github.event.sender.login }}'
+  cancel-in-progress: true
+
+env:
+  GRADLE_ENTERPRISE_ACCESS_KEY: ${{ secrets.GE_ACCESS_TOKEN }}
+  GRADLE_ENTERPRISE_CACHE_USERNAME: ${{ secrets.GE_CACHE_USERNAME }}
+  GRADLE_ENTERPRISE_CACHE_PASSWORD: ${{ secrets.GE_CACHE_PASSWORD }}
+
+jobs:
+  beam_PerformanceTests_BiqQueryIO_Write_Python_Batch:
+    if: |
+      github.event_name == 'workflow_dispatch' ||
+      github.event_name == 'schedule' ||
+      github.event.comment.body == 'Run BigQueryIO Write Performance Test Python'
+    runs-on: [self-hosted, ubuntu-20.04, main]
+    timeout-minutes: 240
+    name: ${{ matrix.job_name }} (${{ matrix.job_phrase }})
+    strategy:
+      matrix:
+        job_name: ["beam_PerformanceTests_BiqQueryIO_Write_Python_Batch"]
+        job_phrase: ["Run BigQueryIO Write Performance Test Python"]
+    steps:
+      - uses: actions/checkout@v3
+      - name: Setup repository
+        uses: ./.github/actions/setup-action
+        with:
+          comment_phrase: ${{ matrix.job_phrase }}
+          github_token: ${{ secrets.GITHUB_TOKEN }}
+          github_job: ${{ matrix.job_name }} (${{ matrix.job_phrase }})
+      - name: Install Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: '3.8'
+      - name: Prepare config
+        id: set_config
+        shell: bash
+        run: |
+          CURDATE=$(date '+%m%d%H%M%S' --utc)
+          CURCONFIG=$(grep -v "^#.*" ./.github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Write_Python.txt | tr '\n' ' ')
+          CONFIGWITHDATE="${CURCONFIG/performance-tests-bqio-write-python-batch-10gb/performance-tests-bqio-write-python-batch-10gb$CURDATE}"
+          echo "prepared_config=$CONFIGWITHDATE" >> "$GITHUB_OUTPUT"
+      - name: run BigQueryIO Write Batch Python Performance Test
+        uses: ./.github/actions/gradle-command-self-hosted-action
+        with:
+          gradle-command: :sdks:python:apache_beam:testing:load_tests:run
+          arguments: |
+            -PloadTest.mainClass=apache_beam.io.gcp.bigquery_write_perf_test \
+            -PpythonVersion=3.8 \
+            -Prunner=DataflowRunner \
+            '-PloadTest.args=${{steps.set_config.outputs.prepared_config}}'
diff --git a/.github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Read_Python.txt b/.github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Read_Python.txt
new file mode 100644
index 000000000000..facf8b91ddb4
--- /dev/null
+++ b/.github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Read_Python.txt
@@ -0,0 +1,33 @@
+###############################################################################
+#  Licensed to the Apache Software Foundation (ASF) under one
+#  or more contributor license agreements.  See the NOTICE file
+#  distributed with this work for additional information
+#  regarding copyright ownership.  The ASF licenses this file
+#  to you under the Apache License, Version 2.0 (the
+#  "License"); you may not use this file except in compliance
+#  with the License.  You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing, software
+#  distributed under the License is distributed on an "AS IS" BASIS,
+#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#  See the License for the specific language governing permissions and
+# limitations under the License.
+###############################################################################
+--job_name=performance-tests-bqio-read-python-10gb
+--project=apache-beam-testing
+--region=us-central1
+--temp_location=gs://temp-storage-for-perf-tests/loadtests
+--input_dataset=beam_performance
+--input_table=bqio_read_10GB
+--publish_to_big_query=true
+--metrics_dataset=beam_performance
+--metrics_table=bqio_read_10GB_results
+--influx_measurement=python_bqio_read_10GB_results
+--influx_db_name=beam_test_metrics
+--influx_hostname=http://10.128.0.96:8086
+--input_options=''{\\"num_records\\":10485760,\\"key_size\\":1,\\"value_size\\":1024,\\"algorithm\\":\\"lcg\\"}''
+--num_workers=5
+--autoscaling_algorithm=NONE
+--runner=DataflowRunner
diff --git a/.github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Write_Python.txt b/.github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Write_Python.txt
new file mode 100644
index 000000000000..b8c6bd9265f0
--- /dev/null
+++ b/.github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Write_Python.txt
@@ -0,0 +1,33 @@
+###############################################################################
+#  Licensed to the Apache Software Foundation (ASF) under one
+#  or more contributor license agreements.  See the NOTICE file
+#  distributed with this work for additional information
+#  regarding copyright ownership.  The ASF licenses this file
+#  to you under the Apache License, Version 2.0 (the
+#  "License"); you may not use this file except in compliance
+#  with the License.  You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing, software
+#  distributed under the License is distributed on an "AS IS" BASIS,
+#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#  See the License for the specific language governing permissions and
+# limitations under the License.
+###############################################################################
+--job_name=performance-tests-bqio-write-python-batch-10gb
+--project=apache-beam-testing
+--region=us-central1
+--temp_location=gs://temp-storage-for-perf-tests/loadtests
+--output_dataset=beam_performance
+--output_table=bqio_write_10GB
+--publish_to_big_query=true
+--metrics_dataset=beam_performance
+--metrics_table=bqio_write_10GB_results
+--influx_measurement=python_bqio_write_10GB_results
+--influx_db_name=beam_test_metrics
+--influx_hostname=http://10.128.0.96:8086
+--input_options=''{\\"num_records\\":10485760,\\"key_size\\":1,\\"value_size\\":1024,\\"algorithm\\":\\"lcg\\"}''
+--num_workers=5
+--autoscaling_algorithm=NONE
+--runner=DataflowRunner

From 7c830271945bcc45e44074685b2ef0e35f2917c9 Mon Sep 17 00:00:00 2001
From: aleksandr-dudko
Date: Wed, 20 Sep 2023 11:28:57 +0400
Subject: [PATCH 2/2] Add comments for set_config

---
 .../beam_PerformanceTests_BiqQueryIO_Read_Python.yml         | 5 +++++
 .../beam_PerformanceTests_BiqQueryIO_Write_Python_Batch.yml  | 5 +++++
 2 files changed, 10 insertions(+)

diff --git a/.github/workflows/beam_PerformanceTests_BiqQueryIO_Read_Python.yml b/.github/workflows/beam_PerformanceTests_BiqQueryIO_Read_Python.yml
index 60821e9ea1c0..224689ee9086 100644
--- a/.github/workflows/beam_PerformanceTests_BiqQueryIO_Read_Python.yml
+++ b/.github/workflows/beam_PerformanceTests_BiqQueryIO_Read_Python.yml
@@ -73,13 +73,18 @@ jobs:
         uses: actions/setup-python@v4
         with:
           python-version: '3.8'
+      # Builds the pipeline options string that the next step passes via -PloadTest.args.
       - name: Prepare config
         id: set_config
         shell: bash
         run: |
+          # UTC timestamp (MMDDhhmmss) used to give every run a distinct job name
           CURDATE=$(date '+%m%d%H%M%S' --utc)
+          # Read the options file, drop lines starting with # and join the rest with spaces
           CURCONFIG=$(grep -v "^#.*" ./.github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Read_Python.txt | tr '\n' ' ')
+          # Append the timestamp to the job name prefix taken from the options file
           CONFIGWITHDATE="${CURCONFIG/performance-tests-bqio-read-python-10gb/performance-tests-bqio-read-python-10gb$CURDATE}"
+          # Expose the result to later steps as steps.set_config.outputs.prepared_config
           echo "prepared_config=$CONFIGWITHDATE" >> "$GITHUB_OUTPUT"
       - name: run BigQueryIO Read Python Performance Test
         uses: ./.github/actions/gradle-command-self-hosted-action
diff --git a/.github/workflows/beam_PerformanceTests_BiqQueryIO_Write_Python_Batch.yml b/.github/workflows/beam_PerformanceTests_BiqQueryIO_Write_Python_Batch.yml
index 3b8a74aae7e7..24cd1b25ca73 100644
--- a/.github/workflows/beam_PerformanceTests_BiqQueryIO_Write_Python_Batch.yml
+++ b/.github/workflows/beam_PerformanceTests_BiqQueryIO_Write_Python_Batch.yml
@@ -73,13 +73,18 @@ jobs:
         uses: actions/setup-python@v4
         with:
           python-version: '3.8'
+      # Builds the pipeline options string that the next step passes via -PloadTest.args.
       - name: Prepare config
         id: set_config
         shell: bash
         run: |
+          # UTC timestamp (MMDDhhmmss) used to give every run a distinct job name
           CURDATE=$(date '+%m%d%H%M%S' --utc)
+          # Read the options file, drop lines starting with # and join the rest with spaces
           CURCONFIG=$(grep -v "^#.*" ./.github/workflows/performance-tests-job-configs/config_PerformanceTests_BiqQueryIO_Write_Python.txt | tr '\n' ' ')
+          # Append the timestamp to the job name prefix taken from the options file
           CONFIGWITHDATE="${CURCONFIG/performance-tests-bqio-write-python-batch-10gb/performance-tests-bqio-write-python-batch-10gb$CURDATE}"
+          # Expose the result to later steps as steps.set_config.outputs.prepared_config
           echo "prepared_config=$CONFIGWITHDATE" >> "$GITHUB_OUTPUT"
       - name: run BigQueryIO Write Batch Python Performance Test
         uses: ./.github/actions/gradle-command-self-hosted-action